about summary refs log tree commit diff
diff options
context:
space:
mode:
authorDominik Maier <domenukk@gmail.com>2020-01-13 23:52:48 +0100
committerGitHub <noreply@github.com>2020-01-13 23:52:48 +0100
commit88d9fba4c7dc757284b244387fc1481676e74bd7 (patch)
tree1a9adc5c8b890ac82a036a87fa30429b600524e1
parent7b02847cd6fa50c4083b0a9985bd85cec8288808 (diff)
downloadafl++-88d9fba4c7dc757284b244387fc1481676e74bd7.tar.gz
C example added
-rw-r--r--unicorn_mode/samples/c/.gitignore2
-rw-r--r--unicorn_mode/samples/c/COMPILE.md22
-rw-r--r--unicorn_mode/samples/c/Makefile42
-rw-r--r--unicorn_mode/samples/c/a.outbin0 -> 17184 bytes
-rw-r--r--unicorn_mode/samples/c/harness.c334
-rw-r--r--unicorn_mode/samples/c/sample_all.sh18
-rw-r--r--unicorn_mode/samples/c/sample_inputs/sample1.bin1
-rw-r--r--unicorn_mode/samples/c/sample_inputs/sample2.binbin0 -> 1 bytes
-rw-r--r--unicorn_mode/samples/c/sample_inputs/sample3.bin1
-rw-r--r--unicorn_mode/samples/c/sample_inputs/sample4.bin1
-rw-r--r--unicorn_mode/samples/c/sample_inputs/sample5.bin1
-rw-r--r--unicorn_mode/samples/c/simple_target.c34
-rw-r--r--unicorn_mode/samples/c/simple_target_x86_64bin0 -> 17624 bytes
13 files changed, 456 insertions, 0 deletions
diff --git a/unicorn_mode/samples/c/.gitignore b/unicorn_mode/samples/c/.gitignore
new file mode 100644
index 00000000..9f744ae5
--- /dev/null
+++ b/unicorn_mode/samples/c/.gitignore
@@ -0,0 +1,2 @@
+harness
+harness-debug
diff --git a/unicorn_mode/samples/c/COMPILE.md b/unicorn_mode/samples/c/COMPILE.md
new file mode 100644
index 00000000..7857e5bf
--- /dev/null
+++ b/unicorn_mode/samples/c/COMPILE.md
@@ -0,0 +1,22 @@
+# C Sample
+
+This shows a simple harness for unicornafl in C
+
+## Compiling harness.c
+
+The target can be built using the `make` command.
+Just make sure you have built unicorn support first:
+```bash
+cd /path/to/afl/unicorn_mode
+./build_unicorn_support.sh
+```
+
+## Compiling simple_target.c
+
+You shouldn't need to compile simple_target.c since an x86_64 binary version is
+pre-built and shipped in this sample folder. This file documents how the binary
+was built in case you want to rebuild it or recompile it for any reason.
+
+The pre-built binary (simple_target_x86_64) was built using -g -O0 in gcc.
+
+We then load the binary and execute the main function directly.
diff --git a/unicorn_mode/samples/c/Makefile b/unicorn_mode/samples/c/Makefile
new file mode 100644
index 00000000..fe100490
--- /dev/null
+++ b/unicorn_mode/samples/c/Makefile
@@ -0,0 +1,42 @@
+# UnicornAFL Usage
+# Original Unicorn Example Makefile by Nguyen Anh Quynh <aquynh@gmail.com>, 2015
+# Adapted for AFL++ by domenukk <domenukk@gmail.com>, 2020
+
+UNAME_S := $(shell uname -s)
+
+LIBDIR = ../../unicornafl
+BIN_EXT =
+AR_EXT = a
+
+# Verbose output?
+V ?= 0
+
+CFLAGS += -Wall -Werror -I../../unicornafl/include
+
+LDFLAGS += -L$(LIBDIR) -lpthread -lm
+ifeq ($(UNAME_S), Linux)
+LDFLAGS += -lrt
+endif
+
+ifneq ($(CROSS),)
+CC = $(CROSS)gcc
+endif
+
+# None of these names a file: `debug` writes harness-debug, never "debug".
+.PHONY: all clean debug
+all: harness
+
+clean:
+	rm -rf *.o harness harness-debug
+
+harness.o: harness.c ../../unicornafl/include/unicorn/*.h
+	${CC} ${CFLAGS} -O3 -c $<
+
+harness-debug.o: harness.c ../../unicornafl/include/unicorn/*.h
+	${CC} ${CFLAGS} -g -c $< -o $@
+
+harness: harness.o
+	${CC} -L${LIBDIR} $< ../../unicornafl/libunicornafl.a $(LDFLAGS) -o $@
+
+debug: harness-debug.o
+	${CC} -L${LIBDIR} $< ../../unicornafl/libunicornafl.a $(LDFLAGS) -o harness-debug
diff --git a/unicorn_mode/samples/c/a.out b/unicorn_mode/samples/c/a.out
new file mode 100644
index 00000000..176c25e1
--- /dev/null
+++ b/unicorn_mode/samples/c/a.out
Binary files differdiff --git a/unicorn_mode/samples/c/harness.c b/unicorn_mode/samples/c/harness.c
new file mode 100644
index 00000000..b928226b
--- /dev/null
+++ b/unicorn_mode/samples/c/harness.c
@@ -0,0 +1,334 @@
+/*
+   Simple test harness for AFL++'s unicornafl c mode.
+
+   This loads the simple_target.bin binary (precompiled as MIPS code) into
+   Unicorn's memory map for emulation, places the specified input into
+   simple_target's buffer (hardcoded to be at 0x300000), and executes 'main()'.
+   If any crashes occur during emulation, this script throws a matching signal
+   to tell AFL that a crash occurred.
+
+   Run under AFL as follows:
+
+   $ cd <afl_path>/unicorn_mode/samples/c/
+   $ make
+<<<<<<< HEAD
+   $ ../../../afl-fuzz -m none -i sample_inputs -o out -- ./harness @@
+=======
+   $ ../../../afl-fuzz -U -m none -i ./sample_inputs -o ./output -- harness @@ 
+>>>>>>> 183a0e7845568def7c6c0118a7ba8128eb094200
+*/
+
+// This is not your everyday Unicorn.
+#define UNICORN_AFL
+
+#include <string.h>
+#include <inttypes.h>
+#include <stdint.h>
+#include <stdbool.h>
+#include <unistd.h>
+#include <sys/stat.h>
+#include <fcntl.h>
+#include <sys/mman.h>
+
+#include <unicorn/unicorn.h>
+
+// Path to the file containing the binary to emulate
+<<<<<<< HEAD
+#define BINARY_FILE ("simple_target_x86_64")
+
+// Memory map for the code to be tested
+// Arbitrary address where code to test will be loaded
+#define BASE_ADDRESS (0x100000)
+#define CODE_ADDRESS (0x101119)
+#define END_ADDRESS  (0x1011d7)
+// Address of the stack (Some random address again)
+#define STACK_ADDRESS (((int64_t) 0x01) << 58)
+// Size of the stack (arbitrarily chosen, just make it big enough)
+#define STACK_SIZE (0x10000)  
+// Location where the input will be placed (make sure the emulated program knows this somehow, too ;) )
+#define INPUT_LOCATION (0x10000)
+// Inside the location, we have an offset in our special case
+#define INPUT_OFFSET (0x16) 
+// Maximum allowable size of mutated data from AFL
+#define INPUT_SIZE_MAX (0x10000)  
+// Alignment for unicorn mappings (seems to be needed)
+#define ALIGNMENT ((uint64_t) 0x1000)
+=======
+#define BINARY_FILE ("simple_target.bin")
+
+// Memory map for the code to be tested
+// Arbitrary address where code to test will be loaded
+#define CODE_ADDRESS  (0x00100000) 
+// Max size for the code (64kb)
+#define STACK_ADDRESS (0x00200000)  
+// Size of the stack (arbitrarily chosen)
+#define STACK_SIZE	  (0x00010000)  
+// Address where mutated data will be placed
+#define DATA_ADDRESS  (0x00300000)  
+// Maximum allowable size of mutated data
+#define DATA_SIZE_MAX (0x00010000)  
+>>>>>>> 183a0e7845568def7c6c0118a7ba8128eb094200
+
+static void hook_block(uc_engine *uc, uint64_t address, uint32_t size, void *user_data) {
+    printf(">>> Tracing basic block at 0x%"PRIx64 ", block size = 0x%x\n", address, size);
+}
+
+static void hook_code(uc_engine *uc, uint64_t address, uint32_t size, void *user_data)
+{
+    printf(">>> Tracing instruction at 0x%"PRIx64 ", instruction size = 0x%x\n", address, size);
+}
+
+<<<<<<< HEAD
+/* Unicorn page needs to be 0x1000 aligned, apparently */
+static uint64_t pad(uint64_t size) {
+    if (size % ALIGNMENT == 0) return size;
+    return ((size / ALIGNMENT) + 1) * ALIGNMENT;
+} 
+
+/* Returns the file size in bytes, or -1 on error. */
+static off_t afl_mmap_file(char *filename, char **buf_ptr) {
+
+    off_t ret = -1;
+=======
+/* Returns the file size in bytes, or -1 on error. */
+static size_t afl_mmap_file(char *filename, char **buf_ptr) {
+
+    int ret = -1;
+>>>>>>> 183a0e7845568def7c6c0118a7ba8128eb094200
+
+    int fd = open(filename, O_RDONLY);
+
+    struct stat st = {0};
+    if (fstat(fd, &st)) goto exit;
+
+    off_t in_len = st.st_size;
+<<<<<<< HEAD
+    if (in_len == -1) {
+	/* This can only ever happen on 32 bit if the file is exactly 4gb. */
+	fprintf(stderr, "Filesize of %s too large", filename);
+	goto exit;
+    }
+=======
+>>>>>>> 183a0e7845568def7c6c0118a7ba8128eb094200
+
+    *buf_ptr = mmap(0, in_len, PROT_READ | PROT_WRITE, MAP_PRIVATE, fd, 0);
+
+    if (*buf_ptr != MAP_FAILED) ret = in_len;
+
+exit:
+    close(fd);
+    return ret;
+
+}
+
+/* Place the input at the right spot inside unicorn */
+<<<<<<< HEAD
+static bool place_input_callback(
+=======
+bool place_input_callback(
+>>>>>>> 183a0e7845568def7c6c0118a7ba8128eb094200
+    uc_engine *uc, 
+    char *input, 
+    size_t input_len, 
+    uint32_t persistent_round, 
+    void *data
+){
+    // printf("Placing input with len %ld to %x\n", input_len, DATA_ADDRESS);
+<<<<<<< HEAD
+    if (input_len >= INPUT_SIZE_MAX - INPUT_OFFSET) {
+        // Test input too long, ignore this testcase
+        return false;
+    }
+    uc_mem_write(uc, INPUT_LOCATION + INPUT_OFFSET, input, input_len);
+    return true;
+}
+
+static void mem_map_checked(uc_engine *uc, uint64_t addr, size_t size, uint32_t mode) {
+    size = pad(size);
+    //printf("SIZE %lx, align: %lx\n", size, ALIGNMENT);
+=======
+    if (input_len > DATA_SIZE_MAX) {
+        // Test input too long, ignore this testcase
+        return false;
+    }
+    uc_mem_write(uc, DATA_ADDRESS, input, input_len);
+    return true;
+}
+
+void mem_map_checked(uc_engine *uc, uint64_t addr, size_t size, uint32_t mode) {
+    // align to 0x1000
+    if (size % 0x1000 != 0) {
+        size = (size / 0x1000) + 1 * 0x1000;
+    }
+>>>>>>> 183a0e7845568def7c6c0118a7ba8128eb094200
+    uc_err err = uc_mem_map(uc, addr, size, mode);
+    if (err != UC_ERR_OK) {
+        printf("Error mapping %ld bytes at 0x%lx: %s (mode: %d)\n", size, addr, uc_strerror(err), mode);
+        exit(1);
+    }
+}
+
+int main(int argc, char **argv, char **envp) {
+    if (argc == 1) {
+<<<<<<< HEAD
+        printf("Test harness for simple_target.bin. Usage: harness [-t] <inputfile>\n");
+=======
+        printf("Test harness for simple_target.bin. Usage: harness [-t] <inputfile>");
+>>>>>>> 183a0e7845568def7c6c0118a7ba8128eb094200
+        exit(1);
+    }
+    bool tracing = false;
+    char *filename = argv[1];
+    if (argc > 2 && !strcmp(argv[1], "-t")) {
+        tracing = true;
+        filename = argv[2];
+    }
+
+    uc_engine *uc;
+    uc_err err;
+    uc_hook hooks[2];
+    char *file_contents;
+
+<<<<<<< HEAD
+    // Initialize emulator in X86_64 mode
+    err = uc_open(UC_ARCH_X86, UC_MODE_64, &uc);
+=======
+    // Initialize emulator in MIPS mode
+    err = uc_open(UC_ARCH_MIPS, UC_MODE_MIPS32 + UC_MODE_BIG_ENDIAN, &uc);
+>>>>>>> 183a0e7845568def7c6c0118a7ba8128eb094200
+    if (err) {
+        printf("Failed on uc_open() with error returned: %u (%s)\n",
+                err, uc_strerror(err));
+        return -1;
+    }
+
+    printf("Loading data input from %s\n", BINARY_FILE);
+<<<<<<< HEAD
+    off_t len = afl_mmap_file(BINARY_FILE, &file_contents);
+    if (len < 0) {
+        perror("Could not read binary to emulate");
+        return -2;
+    }
+    if (len == 0) {
+	fprintf(stderr, "File at '%s' is empty\n", BINARY_FILE);
+	return -3;
+    }
+
+    // Map memory.
+    mem_map_checked(uc, BASE_ADDRESS, len, UC_PROT_ALL);
+    printf("Len: %lx", len);
+    fflush(stdout);
+
+    // write machine code to be emulated to memory
+    if (uc_mem_write(uc, BASE_ADDRESS, file_contents, len) != UC_ERR_OK) {
+=======
+    size_t len = afl_mmap_file(BINARY_FILE, &file_contents);
+    if (len < 0) {
+        perror("Could not read data from file.");
+        return -2;
+    }
+
+    // Map memory.
+    mem_map_checked(uc, CODE_ADDRESS, len, UC_PROT_ALL);
+
+    // write machine code to be emulated to memory
+    if (uc_mem_write(uc, CODE_ADDRESS, &file_contents, len) != UC_ERR_OK) {
+>>>>>>> 183a0e7845568def7c6c0118a7ba8128eb094200
+        printf("Error writing to CODE");
+    }
+
+    // Release copied contents
+    munmap(file_contents, len);
+
+    // Set the program counter to the start of the code
+    uint64_t start_address = CODE_ADDRESS;      // address of entry point of main()
+<<<<<<< HEAD
+    uint64_t end_address = END_ADDRESS; // Address of last instruction in main()
+    uc_reg_write(uc, UC_X86_REG_RIP, &start_address); // address of entry point of main()
+    
+    // Setup the Stack
+    mem_map_checked(uc, STACK_ADDRESS - STACK_SIZE, STACK_SIZE, UC_PROT_READ | UC_PROT_WRITE);
+    uint64_t stack_val = STACK_ADDRESS;
+    printf("%ld", stack_val);
+    uc_reg_write(uc, UC_X86_REG_RSP, &stack_val);
+
+    // reserve some space for our input data
+    mem_map_checked(uc, INPUT_LOCATION, INPUT_SIZE_MAX, UC_PROT_READ);
+
+    // build a "dummy" argv with length 2 at 0x10000:
+    // 0x10000 argv[0]  NULL
+    // 0x10008 argv[1]  (char *)0x10016 --. points to the next offset.
+    // 0x10016 argv[1][0], ...          <-^ contains the actual input data. (INPUT_LOCATION + INPUT_OFFSET)
+
+    uc_mem_write(uc, 0x10008, "\x16\x00\x01", 3); // little endian of 0x10016, see above
+
+    // Set up the function parameters accordingly RSI, RDI (see calling convention/disassembly)
+    uint64_t input_location = INPUT_LOCATION;
+    uc_reg_write(uc, UC_X86_REG_RSI, &input_location); // argv
+    uint64_t emulated_argc = 2;
+    uc_reg_write(uc, UC_X86_REG_RDI, &emulated_argc);  // argc == 2
+   
+=======
+    uint64_t end_address = CODE_ADDRESS + 0xf4; // Address of last instruction in main()
+    uc_reg_write(uc, UC_MIPS_REG_PC, &start_address); // address of entry point of main()
+    
+    // Setup the Stack
+    mem_map_checked(uc, STACK_ADDRESS, STACK_SIZE, UC_PROT_ALL);
+    uint64_t stack_val = STACK_ADDRESS + STACK_SIZE;
+    printf("%ld", stack_val);
+    uc_reg_write(uc, UC_MIPS_REG_SP, &stack_val);
+
+    // reserve some space for data
+    mem_map_checked(uc, DATA_ADDRESS, DATA_SIZE_MAX, UC_PROT_ALL);
+
+>>>>>>> 183a0e7845568def7c6c0118a7ba8128eb094200
+    // If we want tracing output, set the callbacks here
+    if (tracing) {
+        // tracing all basic blocks with customized callback
+        uc_hook_add(uc, &hooks[0], UC_HOOK_BLOCK, hook_block, NULL, 1, 0);
+<<<<<<< HEAD
+        uc_hook_add(uc, &hooks[1], UC_HOOK_CODE, hook_code, NULL, BASE_ADDRESS, BASE_ADDRESS + len - 1);
+=======
+        uc_hook_add(uc, &hooks[1], UC_HOOK_CODE, hook_code, NULL, CODE_ADDRESS, CODE_ADDRESS + len - 1);
+>>>>>>> 183a0e7845568def7c6c0118a7ba8128eb094200
+    }
+
+    printf("Starting to fuzz :)\n");
+    fflush(stdout);
+
+    // let's gooo
+    uc_afl_ret afl_ret = uc_afl_fuzz(
+<<<<<<< HEAD
+        uc, // The unicorn instance we prepared
+        filename, // Filename of the input to process. In AFL this is usually the '@@' placeholder, outside it's any input file.
+        place_input_callback, // Callback that places the input (automatically loaded from the file at filename) in the unicorninstance
+        &end_address, // Where to exit (this is an array)
+        1,  // Count of end addresses
+        NULL, // Optional calback to run after each exec
+        false,
+        1, // For persistent mode: How many rounds to run
+=======
+        uc,
+        filename,
+        place_input_callback,
+        &end_address,
+        1,
+        NULL,
+        false,
+        1,
+>>>>>>> 183a0e7845568def7c6c0118a7ba8128eb094200
+        NULL
+    );
+    switch(afl_ret) {
+        case UC_AFL_RET_ERROR:
+            printf("Error starting to fuzz");
+            return -3;
+            break;
+        case UC_AFL_RET_NO_AFL:
+            printf("No AFL attached - We are done with a single run.");
+            break;
+        default:
+            break;
+    } 
+    return 0;
+}
diff --git a/unicorn_mode/samples/c/sample_all.sh b/unicorn_mode/samples/c/sample_all.sh
new file mode 100644
index 00000000..01daf365
--- /dev/null
+++ b/unicorn_mode/samples/c/sample_all.sh
@@ -0,0 +1,18 @@
+#!/bin/sh
+# Sets the platform's dynamic-library search path and checks that the harness exists.
+[ -z "${UNAME}" ] && UNAME=$(uname)
+
+DIR=$(dirname "$0")
+
+if [ "$UNAME" = Darwin ]; then
+  export DYLD_LIBRARY_PATH=../../unicorn
+else
+  export LD_LIBRARY_PATH=../../unicorn
+fi
+
+# Bail out early when the harness binary is missing from the script's directory.
+# `[ ! -e FILE ]` is the existence test; `[` needs its closing `]` as a separate word.
+if [ ! -e "$DIR/harness" ]; then
+  echo "[!] harness not found in $DIR"
+  exit 1
+fi
\ No newline at end of file
diff --git a/unicorn_mode/samples/c/sample_inputs/sample1.bin b/unicorn_mode/samples/c/sample_inputs/sample1.bin
new file mode 100644
index 00000000..85df5078
--- /dev/null
+++ b/unicorn_mode/samples/c/sample_inputs/sample1.bin
@@ -0,0 +1 @@
+abcd
\ No newline at end of file
diff --git a/unicorn_mode/samples/c/sample_inputs/sample2.bin b/unicorn_mode/samples/c/sample_inputs/sample2.bin
new file mode 100644
index 00000000..f76dd238
--- /dev/null
+++ b/unicorn_mode/samples/c/sample_inputs/sample2.bin
Binary files differdiff --git a/unicorn_mode/samples/c/sample_inputs/sample3.bin b/unicorn_mode/samples/c/sample_inputs/sample3.bin
new file mode 100644
index 00000000..6b2aaa76
--- /dev/null
+++ b/unicorn_mode/samples/c/sample_inputs/sample3.bin
@@ -0,0 +1 @@
+
\ No newline at end of file
diff --git a/unicorn_mode/samples/c/sample_inputs/sample4.bin b/unicorn_mode/samples/c/sample_inputs/sample4.bin
new file mode 100644
index 00000000..71bd63e6
--- /dev/null
+++ b/unicorn_mode/samples/c/sample_inputs/sample4.bin
@@ -0,0 +1 @@
+
\ No newline at end of file
diff --git a/unicorn_mode/samples/c/sample_inputs/sample5.bin b/unicorn_mode/samples/c/sample_inputs/sample5.bin
new file mode 100644
index 00000000..aed2973e
--- /dev/null
+++ b/unicorn_mode/samples/c/sample_inputs/sample5.bin
@@ -0,0 +1 @@
+
\ No newline at end of file
diff --git a/unicorn_mode/samples/c/simple_target.c b/unicorn_mode/samples/c/simple_target.c
new file mode 100644
index 00000000..dbf10911
--- /dev/null
+++ b/unicorn_mode/samples/c/simple_target.c
@@ -0,0 +1,34 @@
+/*
+ * Sample target file to test afl-unicorn fuzzing capabilities.
+ * This is a very trivial example that will crash pretty easily
+ * in several different exciting ways. 
+ *
+ * Input is read from the buffer that argv[1] points to, so make
+ * sure that your Unicorn emulation sets up argc/argv and puts
+ * user data there.
+ *
+ * Written by Nathan Voss <njvoss99@gmail.com>
+ * Adapted by Lukas Seidel <seidel.1@campus.tu-berlin.de>
+ */
+
+
+int main(int argc, char** argv) {
+  if(argc < 2){
+     return -1;
+  }
+
+  char *data_buf = argv[1];  // input buffer is taken from the first argument
+
+  if (data_buf[20] != 0) {
+    // Cause an 'invalid read' crash if data[20] is non-zero
+    unsigned char invalid_read = *(unsigned char *) 0x00000000;
+  } else if (data_buf[0] > 0x10 && data_buf[0] < 0x20 && data_buf[1] > data_buf[2]) {
+    // Cause an 'invalid read' crash if (0x10 < data[0] < 0x20) and data[1] > data[2]
+    unsigned char invalid_read = *(unsigned char *) 0x00000000;
+  } else if (data_buf[9] == 0x00 && data_buf[10] != 0x00 && data_buf[11] == 0x00) {
+    // Cause a crash if data[10] is not zero, but [9] and [11] are zero
+    unsigned char invalid_read = *(unsigned char *) 0x00000000;
+  }
+
+  return 0;
+}
diff --git a/unicorn_mode/samples/c/simple_target_x86_64 b/unicorn_mode/samples/c/simple_target_x86_64
new file mode 100644
index 00000000..560264fd
--- /dev/null
+++ b/unicorn_mode/samples/c/simple_target_x86_64
Binary files differ