mirror of
https://github.com/radareorg/radare2.git
synced 2025-01-25 15:24:36 +00:00
bfbd12ed3c
* Update and simplify gdiff
273 lines
7.4 KiB
C
273 lines
7.4 KiB
C
/* radare - LGPL - Copyright 2010 - nibble<develsec.org> */
|
|
|
|
#include <stdio.h>
|
|
#include <string.h>
|
|
#include <r_anal.h>
|
|
#include <r_list.h>
|
|
#include <r_util.h>
|
|
#include <r_core.h>
|
|
#include "gdiff.h"
|
|
|
|
/* XXX NEED A HASH ALGO */
|
|
static ut32 gdiff_get_prime(char* mnemonic) {
|
|
int i;
|
|
|
|
if (mnemonic)
|
|
for (i=0; i < 442; i++)
|
|
if (!strcmp (mnemonic, mnemonics[i]))
|
|
return primes[i];
|
|
return 1;
|
|
#if 0
|
|
ut64 index = 0;
|
|
char *ch;
|
|
|
|
ch = (char *)mnemonic + strlen (mnemonic)-1;
|
|
do {
|
|
index = index*32 + (*ch-0x60) & 0xff;
|
|
} while (ch-- > (char*)mnemonic);
|
|
return primes[index % sizeof (primes)];
|
|
#endif
|
|
}
|
|
|
|
static void gdiff_fingerprint_bb(RAnalBlock *bb) {
|
|
RAnalOp *op;
|
|
RListIter *iter;
|
|
|
|
r_big_set_str (bb->fingerprint, "1");
|
|
r_list_foreach (bb->aops, iter, op)
|
|
r_big_mul_ut (bb->fingerprint, bb->fingerprint, gdiff_get_prime (op->mnemonic));
|
|
}
|
|
|
|
static void gdiff_fingerprint_fcn(RList *bbs, RAnalFcn *fcn) {
|
|
RAnalBlock *bb;
|
|
RListIter *iter;
|
|
|
|
r_big_set_str (fcn->fingerprint, "1");
|
|
r_list_foreach (bbs, iter, bb)
|
|
if (bb->addr >= fcn->addr && bb->addr < fcn->addr + fcn->size)
|
|
r_big_mul (fcn->fingerprint, fcn->fingerprint, bb->fingerprint);
|
|
}
|
|
|
|
static void gdiff_diff_bb(RAnalFcn *mfcn, RAnalFcn *mfcn2, RList *bbs, RList *bbs2) {
|
|
RAnalBlock *bb, *bb2, *mbb, *mbb2;
|
|
RListIter *iter, *iter2;
|
|
RNumBig *fingerprint, *fingerprint2;
|
|
float t, ot;
|
|
int i, p;
|
|
|
|
fingerprint = r_big_new (NULL);
|
|
fingerprint2 = r_big_new (NULL);
|
|
|
|
iter = r_list_iterator (bbs);
|
|
while (r_list_iter_next (iter)) {
|
|
bb = r_list_iter_get (iter);
|
|
if (bb->diff == R_ANAL_DIFF_NULL &&
|
|
bb->addr >= mfcn->addr && bb->addr < mfcn->addr + mfcn->size) {
|
|
ot = 0;
|
|
mbb = mbb2 = NULL;
|
|
iter2 = r_list_iterator (bbs2);
|
|
while (r_list_iter_next (iter2)) {
|
|
bb2 = r_list_iter_get (iter2);
|
|
if (bb2->diff == R_ANAL_DIFF_NULL &&
|
|
bb2->addr >= mfcn2->addr && bb2->addr < mfcn2->addr + mfcn2->size) {
|
|
p = 0;
|
|
t = 0;
|
|
if (r_big_cmp (bb->fingerprint, bb2->fingerprint) != 0) {
|
|
r_big_set (fingerprint, bb->fingerprint);
|
|
r_big_set (fingerprint2, bb2->fingerprint);
|
|
while ( r_big_cmp_st (fingerprint, 1) != 0 &&
|
|
r_big_cmp_st (fingerprint2, 1) != 0) {
|
|
for (i = 0; i < NPRIMES; i++)
|
|
if (r_big_divisible_ut (fingerprint, primes[i]) &&
|
|
r_big_divisible_ut (fingerprint2, primes[i])) {
|
|
r_big_div_ut (fingerprint, fingerprint, primes[i]);
|
|
r_big_div_ut (fingerprint2, fingerprint2, primes[i]);
|
|
p++;
|
|
break;
|
|
}
|
|
if (i == NPRIMES)
|
|
break;
|
|
}
|
|
} else {
|
|
if (bb->ninstr > bb2->ninstr)
|
|
p = bb->ninstr;
|
|
else p = bb2->ninstr;
|
|
}
|
|
if (bb->ninstr > bb2->ninstr)
|
|
t = (float)1-(float)(bb->ninstr-p)/bb->ninstr;
|
|
else t = (float)1-(float)(bb2->ninstr-p)/bb2->ninstr;
|
|
#if 0
|
|
printf ("BB: %llx - %llx => %i - %i - %i => %f\n", bb->addr, bb2->addr,
|
|
bb->ninstr, bb2->ninstr, p, t);
|
|
#endif
|
|
if (t > THRESHOLDBB && t > ot) {
|
|
ot = t;
|
|
mbb = bb;
|
|
mbb2 = bb2;
|
|
}
|
|
}
|
|
}
|
|
if (mbb != NULL && mbb2 != NULL) {
|
|
if (ot == 1)
|
|
mbb->diff = mbb2->diff = R_ANAL_DIFF_MATCH;
|
|
else
|
|
mbb->diff = mbb2->diff = R_ANAL_DIFF_UNMATCH;
|
|
}
|
|
}
|
|
}
|
|
|
|
r_big_free (fingerprint);
|
|
r_big_free (fingerprint2);
|
|
}
|
|
|
|
static void gdiff_diff_fcn(RList *fcns, RList *fcns2, RList *bbs, RList *bbs2) {
|
|
RAnalFcn *fcn, *fcn2, *mfcn, *mfcn2;
|
|
RListIter *iter, *iter2;
|
|
RNumBig *fingerprint, *fingerprint2;
|
|
float t, ot;
|
|
int i, p;
|
|
|
|
fingerprint = r_big_new (NULL);
|
|
fingerprint2 = r_big_new (NULL);
|
|
|
|
iter = r_list_iterator (fcns);
|
|
while (r_list_iter_next (iter)) {
|
|
fcn = r_list_iter_get (iter);
|
|
ot = 0;
|
|
mfcn = mfcn2 = NULL;
|
|
iter2 = r_list_iterator (fcns2);
|
|
while (r_list_iter_next (iter2)) {
|
|
fcn2 = r_list_iter_get (iter2);
|
|
p = 0;
|
|
t = 0;
|
|
if (r_big_cmp (fcn->fingerprint, fcn2->fingerprint) != 0) {
|
|
r_big_set (fingerprint, fcn->fingerprint);
|
|
r_big_set (fingerprint2, fcn2->fingerprint);
|
|
while ( r_big_cmp_st (fingerprint, 1) != 0 &&
|
|
r_big_cmp_st (fingerprint2, 1) != 0) {
|
|
for (i = 0; i < NPRIMES; i++)
|
|
if (r_big_divisible_ut (fingerprint, primes[i]) &&
|
|
r_big_divisible_ut (fingerprint2, primes[i])) {
|
|
r_big_div_ut (fingerprint, fingerprint, primes[i]);
|
|
r_big_div_ut (fingerprint2, fingerprint2, primes[i]);
|
|
p++;
|
|
break;
|
|
}
|
|
if (i == NPRIMES)
|
|
break;
|
|
}
|
|
} else {
|
|
if (fcn->ninstr > fcn2->ninstr)
|
|
p = fcn->ninstr;
|
|
else p = fcn2->ninstr;
|
|
}
|
|
if (fcn->ninstr > fcn2->ninstr)
|
|
t = (float)1-(float)(fcn->ninstr-p)/fcn->ninstr;
|
|
else t = (float)1-(float)(fcn2->ninstr-p)/fcn2->ninstr;
|
|
#if 0
|
|
printf ("FCN: %s - %s => %i - %i - %i => %f\n", fcn->name, fcn2->name,
|
|
fcn->ninstr, fcn2->ninstr, p, t);
|
|
#endif
|
|
if (t > THRESHOLDFCN && t > ot) {
|
|
ot = t;
|
|
mfcn = fcn;
|
|
mfcn2 = fcn2;
|
|
}
|
|
}
|
|
if (mfcn != NULL && mfcn2 != NULL) {
|
|
/* Diff basic blocks and remove matched functions */
|
|
#if 0
|
|
printf ("Match => %s - %s\n", mfcn->name, mfcn2->name);
|
|
#endif
|
|
if (ot == 1)
|
|
mfcn->diff = mfcn2->diff = R_ANAL_DIFF_MATCH;
|
|
else
|
|
mfcn->diff = mfcn2->diff = R_ANAL_DIFF_UNMATCH;
|
|
gdiff_diff_bb (mfcn, mfcn2, bbs, bbs2);
|
|
}
|
|
}
|
|
|
|
r_big_free (fingerprint);
|
|
r_big_free (fingerprint2);
|
|
}
|
|
|
|
R_API int r_core_gdiff(RCore *core, char *file1, char *file2, int va) {
|
|
RCore *core2;
|
|
RAnalFcn *fcn;
|
|
RAnalBlock *bb;
|
|
RList *fcns[2], *bbs[2];
|
|
RListIter *iter;
|
|
char *files[2] = {file1, file2};
|
|
int i;
|
|
|
|
/* Init resources */
|
|
core2 = r_core_new ();
|
|
|
|
for (i = 0; i < 2; i++) {
|
|
/* Load and analyze bin*/
|
|
r_config_set_i (core2->config, "io.va", va);
|
|
if (!r_core_file_open (core2, files[i], 0)) {
|
|
fprintf (stderr, "Cannot open file '%s'\n", files[i]);
|
|
return R_FALSE;
|
|
}
|
|
r_config_set (core2->config, "anal.plugin", "x86_x86im");
|
|
r_config_set_i (core2->config, "anal.split", 0);
|
|
r_core_cmd0 (core2, "fs *");
|
|
r_core_cmd0 (core2, "af @ entry0");
|
|
r_core_cmd0 (core2, "af @ main");
|
|
r_core_cmd0 (core2, "af @@ fcn.");
|
|
r_core_cmd0 (core2, "ab @@ fcn.");
|
|
/* Copy bb's and fcn's */
|
|
bbs[i] = r_list_new ();
|
|
bbs[i]->free = &r_anal_bb_free;
|
|
iter = r_list_iterator (core2->anal->bbs);
|
|
while (r_list_iter_next (iter)) {
|
|
bb = r_list_iter_get (iter);
|
|
r_list_split (core2->anal->bbs, bb);
|
|
r_list_append (bbs[i], bb);
|
|
}
|
|
fcns[i] = r_list_new ();
|
|
fcns[i]->free = &r_anal_fcn_free;
|
|
iter = r_list_iterator (core2->anal->fcns);
|
|
while (r_list_iter_next (iter)) {
|
|
fcn = r_list_iter_get (iter);
|
|
r_list_split (core2->anal->fcns, fcn);
|
|
r_list_append (fcns[i], fcn);
|
|
}
|
|
/* Fingerprint bb's and fcn's */
|
|
r_list_foreach (bbs[i], iter, bb)
|
|
gdiff_fingerprint_bb (bb);
|
|
r_list_foreach (fcns[i], iter, fcn)
|
|
gdiff_fingerprint_fcn (bbs[i], fcn);
|
|
/* Remove flags and analysis info */
|
|
r_core_cmd0 (core2, "af-");
|
|
r_core_cmd0 (core2, "ab-");
|
|
r_core_cmd0 (core2, "f-*");
|
|
}
|
|
|
|
/* Diff functions */
|
|
/* XXX Avoid dupped code diffing bb's directly? */
|
|
gdiff_diff_fcn (fcns[0], fcns[1], bbs[0], bbs[1]);
|
|
|
|
/* Fill analysis info in core */
|
|
iter = r_list_iterator (bbs[0]);
|
|
while (r_list_iter_next (iter)) {
|
|
bb = r_list_iter_get (iter);
|
|
r_anal_bb_add (core->anal, bb->addr, bb->size, bb->jump, bb->fail, bb->type, bb->diff);
|
|
}
|
|
iter = r_list_iterator (fcns[0]);
|
|
while (r_list_iter_next (iter)) {
|
|
fcn = r_list_iter_get (iter);
|
|
r_anal_fcn_add (core->anal, fcn->addr, fcn->size, fcn->name, fcn->diff);
|
|
}
|
|
|
|
/* Free resources */
|
|
r_core_free (core2);
|
|
for (i=0;i<2;i++) {
|
|
r_list_free (bbs[i]);
|
|
r_list_free (fcns[i]);
|
|
}
|
|
|
|
return R_TRUE;
|
|
}
|