[Forensics-changes] [yara] 179/415: Some code cleanup

Thu Apr 3 05:43:02 UTC 2014

This is an automated email from the git hooks/post-receive script.

bengen pushed a commit to branch debian
in repository yara.

commit ac0319ca05ffcbe5558eb0ded14a729ebc88bbde
Author: Victor M. Alvarez <plusvic at gmail.com>
Date:   Wed Jun 26 11:34:30 2013 +0000

    Some code cleanup
---
 libyara/ahocorasick.c | 285 +++++++++++++++++++++++++-------------------------
 libyara/exec.c        |  37 ++-----
 libyara/mem.c         |  47 ++++++---
 3 files changed, 181 insertions(+), 188 deletions(-)

diff --git a/libyara/ahocorasick.c b/libyara/ahocorasick.c
index 6038ca8..e3f33db 100644
--- a/libyara/ahocorasick.c
+++ b/libyara/ahocorasick.c
@@ -24,9 +24,12 @@ limitations under the License.
 #include "yara.h"
 
 
-#define MAX_TOKEN 4
+#define MAX_ATOM 4
 #define MAX_TABLE_BASED_STATES_DEPTH 1
 
+#ifdef _MSC_VER
+#define inline __inline
+#endif
 
 #ifndef min
 #define min(x, y) ((x < y) ? (x) : (y))
@@ -342,65 +345,65 @@ AC_STATE* _yr_ac_create_state(
 //
 // _yr_ac_gen_case_combinations
 //
-// Returns all combinations of lower and upper cases for a given token. For
-// token "abc" the output would be "abc" "abC" "aBC" and so on. Resulting
-// tokens are written into the output buffer in this format:
+// Returns all combinations of lower and upper cases for a given atom. For
+// atom "abc" the output would be "abc" "abC" "aBC" and so on. Resulting
+// atoms are written into the output buffer in this format:
 //
-//  [size 1] [backtrack 1] [token 1]  ... [size N] [backtrack N] [token N] [0]
+//  [size 1] [backtrack 1] [atom 1]  ... [size N] [backtrack N] [atom N] [0]
 //
 // Notice the zero at the end to indicate where the output ends.
 //
 // The caller is responsible of providing a buffer large enough to hold the
-// returned tokens.
+// returned atoms.
 //
 
 uint8_t* _yr_ac_gen_case_combinations(
-    uint8_t* token,
-    int token_length,
-    int token_offset,
-    int token_backtrack,
+    uint8_t* atom,
+    int atom_length,
+    int atom_offset,
+    int atom_backtrack,
     uint8_t* output_buffer)
 {
   char c;
-  char* new_token;
+  char* new_atom;
 
-  if (token_offset + 1 < token_length)
+  if (atom_offset + 1 < atom_length)
     output_buffer = _yr_ac_gen_case_combinations(
-        token,
-        token_length,
-        token_offset + 1,
-        token_backtrack,
+        atom,
+        atom_length,
+        atom_offset + 1,
+        atom_backtrack,
         output_buffer);
 
-  c = token[token_offset];
+  c = atom[atom_offset];
 
   if ((c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z'))
   {
-    // Write token length.
-    *((int*) output_buffer) = token_length;
+    // Write atom length.
+    *((int*) output_buffer) = atom_length;
     output_buffer += sizeof(int);
 
-    // Write token backtrack.
-    *((int*) output_buffer) = token_backtrack;
+    // Write atom backtrack.
+    *((int*) output_buffer) = atom_backtrack;
     output_buffer += sizeof(int);
 
-    memcpy(output_buffer, token, token_length);
+    memcpy(output_buffer, atom, atom_length);
 
-    new_token = output_buffer;
-    output_buffer += token_length;
+    new_atom = output_buffer;
+    output_buffer += atom_length;
 
     // Swap character case.
     if (c >= 'a' && c <= 'z')
-      new_token[token_offset] -= 32;
+      new_atom[atom_offset] -= 32;
     else
-      new_token[token_offset] += 32;
+      new_atom[atom_offset] += 32;
 
-    if (token_offset + 1 < token_length)
+    if (atom_offset + 1 < atom_length)
       output_buffer = _yr_ac_gen_case_combinations(
-          new_token,
-          token_length,
-          token_offset + 1,
-          token_backtrack,
+          new_atom,
+          atom_length,
+          atom_offset + 1,
+          atom_backtrack,
           output_buffer);
   }
 
@@ -408,48 +411,48 @@ uint8_t* _yr_ac_gen_case_combinations(
 }
 
 //
-// _yr_ac_gen_hex_tokens
+// _yr_ac_gen_hex_atoms
 //
-// Generates token for a hex string. The token will be a substring of length
-// up to MAX_TOKEN, generally a prefix, but not necessarily. The token can
+// Generates atom for a hex string. The atom will be a substring of length
+// up to MAX_ATOM, generally a prefix, but not necessarily. The atom can
 // also be extracted from the middle of the string when the prefix is not long
-// enough. The function will try to choose a token with as many distinct bytes
-// as posible, avoiding tokens like 00 00 00 00 which are too common.
+// enough. The function will try to choose an atom with as many distinct bytes
+// as posible, avoiding atoms like 00 00 00 00 which are too common.
 // For example, in the string
 //
 //    98 56 ?? ?? 00 00 00 00 34 EB 45 97 21
 //
-// the token would be 34 EB 45 97 (assuming MAX_TOKEN is 4) instead of 98 56,
+// the atom would be 34 EB 45 97 (assuming MAX_ATOM is 4) instead of 98 56,
 // which is shorter, or 00 00 00 00 which is more homogeneous.
 //
 
-uint8_t* _yr_ac_gen_hex_tokens(
+uint8_t* _yr_ac_gen_hex_atoms(
     STRING* string,
-    int max_token_length,
+    int max_atom_length,
     uint8_t* output_buffer)
 {
   int inside_or = 0;
-  int token_length = 0;
+  int atom_length = 0;
   int backtrack = 0;
   int unique_bytes = 0;
   int max_unique_bytes = 0;
-  int candidate_token_position = 0;
-  int candidate_token_length = 0;
-  int candidate_token_backtrack = 0;
+  int candidate_atom_position = 0;
+  int candidate_atom_length = 0;
+  int candidate_atom_backtrack = 0;
   int or_string_length = 0;
   int previous_or_string_length = 0;
   int string_position = 0;
   int i, j, unique;
 
   uint8_t* mask;
-  uint8_t last[MAX_TOKEN];
+  uint8_t last[MAX_ATOM];
 
   mask = string->mask;
 
   while (*mask != MASK_END)
   {
-    if (token_length == 0)
-      for (i = 0; i < max_token_length; i++)
+    if (atom_length == 0)
+      for (i = 0; i < max_atom_length; i++)
         last[i] = string->string[string_position];
 
     // We entered an OR operation like (01 | 02).
@@ -461,21 +464,21 @@ uint8_t* _yr_ac_gen_hex_tokens(
       inside_or = FALSE;
 
     // If non-wildcard byte and not inside an OR it could
-    // be used for the token.
+    // be used for the atom.
     if (*mask == 0xFF && !inside_or)
     {
-      token_length++;
-      token_length = min(token_length, max_token_length);
+      atom_length++;
+      atom_length = min(atom_length, max_atom_length);
 
-      last[string_position % max_token_length] = \
+      last[string_position % max_atom_length] = \
           string->string[string_position];
 
       unique_bytes = 1;
 
-      for (i = 0; i < max_token_length - 1; i++)
+      for (i = 0; i < max_atom_length - 1; i++)
       {
         unique = TRUE;
-        for (j = i + 1; j < max_token_length; j++)
+        for (j = i + 1; j < max_atom_length; j++)
         {
           if (last[i] == last[j])
           {
@@ -488,21 +491,21 @@ uint8_t* _yr_ac_gen_hex_tokens(
       }
 
       if (unique_bytes > max_unique_bytes ||
-          token_length > candidate_token_length)
+          atom_length > candidate_atom_length)
       {
         max_unique_bytes = unique_bytes;
-        candidate_token_position = string_position - token_length + 1;
-        candidate_token_backtrack = backtrack - token_length + 1;
-        candidate_token_length = token_length;
+        candidate_atom_position = string_position - atom_length + 1;
+        candidate_atom_backtrack = backtrack - atom_length + 1;
+        candidate_atom_length = atom_length;
 
-        if (candidate_token_length == max_token_length &&
-            max_unique_bytes == max_token_length)
+        if (candidate_atom_length == max_atom_length &&
+            max_unique_bytes == max_atom_length)
           break;
       }
     }
     else
     {
-      token_length = 0;
+      atom_length = 0;
     }
 
     if (*mask != MASK_OR &&
@@ -536,7 +539,7 @@ uint8_t* _yr_ac_gen_hex_tokens(
       // alternatives of different size like: (01 | 02 03)
       // instead of (01 | 02). In those cases the backtrack
       // value would be different for each alternative, so
-      // we don't want any token past the OR.
+      // we don't want any atom past the OR.
       if (or_string_length != previous_or_string_length)
         break;
 
@@ -552,46 +555,46 @@ uint8_t* _yr_ac_gen_hex_tokens(
     mask++;
   }
 
-  *((int*) output_buffer) = candidate_token_length;
+  *((int*) output_buffer) = candidate_atom_length;
   output_buffer += sizeof(int);
 
-  *((int*) output_buffer) = candidate_token_backtrack;
+  *((int*) output_buffer) = candidate_atom_backtrack;
   output_buffer += sizeof(int);
 
   memcpy(
       output_buffer,
-      string->string + candidate_token_position,
-      candidate_token_length);
+      string->string + candidate_atom_position,
+      candidate_atom_length);
 
-  output_buffer += candidate_token_length;
+  output_buffer += candidate_atom_length;
 
   return output_buffer;
 }
 
 //
-// _yr_ac_gen_regexp_tokens
+// _yr_ac_gen_regexp_atoms
 //
-// Generates tokens for a regular expression.
+// Generates atoms for a regular expression.
 //
 
-uint8_t* _yr_ac_gen_regexp_tokens(
+uint8_t* _yr_ac_gen_regexp_atoms(
     STRING* string,
-    int max_token_length,
+    int max_atom_length,
     uint8_t* output_buffer)
 {
-  uint8_t token[MAX_TOKEN];
+  uint8_t atom[MAX_ATOM];
   uint8_t first_bytes[256];
   uint8_t current;
   uint8_t next;
 
   int first_bytes_count;
-  int token_length = 0;
+  int atom_length = 0;
   int i = 0;
 
   if (string->string[0] == '^')
     i++;
 
-  while (i < string->length && token_length < max_token_length)
+  while (i < string->length && atom_length < max_atom_length)
   {
     current = string->string[i];
 
@@ -602,20 +605,20 @@ uint8_t* _yr_ac_gen_regexp_tokens(
 
     if (current == '\\' && isregexescapable[next])
     {
-      token[token_length] = next;
-      token_length++;
+      atom[atom_length] = next;
+      atom_length++;
       i += 2;
     }
     else if (isregexhashable[current] &&
              next != '*' && next != '{' && next != '?')
     {
-      // Add current character to the token if it's hashable and the next one
+      // Add current character to the atom if it's hashable and the next one
       // is not a quantifier. Quantifiers can make the character optional like
       // in abc*, abc{0,N}, abc?. In all this regexps the 'c' is not required
       // to appear in a matching string.
 
-      token[token_length] = current;
-      token_length++;
+      atom[atom_length] = current;
+      atom_length++;
       i++;
     }
     else
@@ -624,21 +627,21 @@ uint8_t* _yr_ac_gen_regexp_tokens(
     }
   }
 
-  if (token_length > 0)
+  if (atom_length > 0)
   {
-    *((int*) output_buffer) = token_length;
+    *((int*) output_buffer) = atom_length;
     output_buffer += sizeof(int);
 
     *((int*) output_buffer) = 0;
     output_buffer += sizeof(int);
 
-    memcpy(output_buffer, token, token_length);
-    output_buffer += token_length;
+    memcpy(output_buffer, atom, atom_length);
+    output_buffer += atom_length;
 
     if (STRING_IS_NO_CASE(string))
       output_buffer = _yr_ac_gen_case_combinations(
-          token,
-          token_length,
+          atom,
+          atom_length,
           0,
           0,
           output_buffer);
@@ -649,7 +652,7 @@ uint8_t* _yr_ac_gen_regexp_tokens(
 
     for (i = 0; i < first_bytes_count; i++)
     {
-      // Write token length.
+      // Write atom length.
       *((int*) output_buffer) = 1;
       output_buffer += sizeof(int);
 
@@ -667,46 +670,46 @@ uint8_t* _yr_ac_gen_regexp_tokens(
 
 
 //
-// _yr_ac_gen_tokens
+// _yr_ac_gen_atoms
 //
-// Returns the tokens to be added to the Aho-Corasick automaton for
-// a given YARA string. Length of tokens is limited by max_token_lengh.
+// Returns the atoms to be added to the Aho-Corasick automaton for
+// a given YARA string. Length of atoms is limited by max_atom_lengh.
 // Tokens are written to the output buffer in the same format used by
 // _yr_ac_gen_case_combinations.
 //
 
-void _yr_ac_gen_tokens(
+void _yr_ac_gen_atoms(
     STRING* string,
-    int max_token_length,
+    int max_atom_length,
     uint8_t* output_buffer)
 {
   int i, j;
-  int token_length;
+  int atom_length;
   void* str;
 
 
   if (STRING_IS_HEX(string))
   {
-    output_buffer = _yr_ac_gen_hex_tokens(
+    output_buffer = _yr_ac_gen_hex_atoms(
         string,
-        max_token_length,
+        max_atom_length,
         output_buffer);
   }
   else if (STRING_IS_REGEXP(string))
   {
-    output_buffer = _yr_ac_gen_regexp_tokens(
+    output_buffer = _yr_ac_gen_regexp_atoms(
         string,
-        max_token_length,
+        max_atom_length,
         output_buffer);
   }
   else // text string
   {
     if (STRING_IS_ASCII(string))
     {
-      token_length = min(string->length, max_token_length);
+      atom_length = min(string->length, max_atom_length);
 
-      // Write token length.
-      *((int*) output_buffer) = token_length;
+      // Write atom length.
+      *((int*) output_buffer) = atom_length;
       output_buffer += sizeof(int);
 
       // Write backtrack value.
@@ -715,14 +718,14 @@ void _yr_ac_gen_tokens(
 
       str = output_buffer;
 
-      memcpy(output_buffer, string->string, token_length);
-      output_buffer += token_length;
+      memcpy(output_buffer, string->string, atom_length);
+      output_buffer += atom_length;
 
       if (STRING_IS_NO_CASE(string))
       {
         output_buffer = _yr_ac_gen_case_combinations(
             str,
-            token_length,
+            atom_length,
             0,
             0,
             output_buffer);
@@ -731,10 +734,10 @@ void _yr_ac_gen_tokens(
 
     if (STRING_IS_WIDE(string))
     {
-      token_length = min(string->length * 2, max_token_length);
+      atom_length = min(string->length * 2, max_atom_length);
 
-      // Write token length.
-      *((int*) output_buffer) = token_length;
+      // Write atom length.
+      *((int*) output_buffer) = atom_length;
       output_buffer += sizeof(int);
 
       // Write backtrack value.
@@ -744,7 +747,7 @@ void _yr_ac_gen_tokens(
       str = output_buffer;
       i = j = 0;
 
-      while(i < token_length)
+      while(i < atom_length)
       {
         if (i % 2 == 0)
           *(((uint8_t*) output_buffer)++) = string->string[j++];
@@ -757,7 +760,7 @@ void _yr_ac_gen_tokens(
       {
         output_buffer = _yr_ac_gen_case_combinations(
             str,
-            token_length,
+            atom_length,
             0,
             0,
             output_buffer);
@@ -941,46 +944,46 @@ int yr_ac_add_string(
     ARENA* arena,
     AC_AUTOMATON* automaton,
     STRING* string,
-    int* min_token_length)
+    int* min_atom_length)
 {
   int result;
-  int token_length;
-  int token_backtrack;
+  int atom_length;
+  int atom_backtrack;
   int i;
 
   AC_STATE* state;
   AC_STATE* next_state;
   AC_MATCH* new_match;
 
-  uint8_t* tokens;
-  uint8_t* tokens_cursor;
+  uint8_t* atoms;
+  uint8_t* atoms_cursor;
 
-  // Reserve memory to hold tokens for the string. We reserve enough memory
+  // Reserve memory to hold atoms for the string. We reserve enough memory
   // for the worst case which is a "ascii wide nocase" text string.
 
-  tokens = yr_malloc(
-      2 * (1 << MAX_TOKEN) * (2 * sizeof(int) + MAX_TOKEN) + sizeof(int));
+  atoms = yr_malloc(
+      2 * (1 << MAX_ATOM) * (2 * sizeof(int) + MAX_ATOM) + sizeof(int));
 
-  if (tokens == NULL)
+  if (atoms == NULL)
     return ERROR_INSUFICIENT_MEMORY;
 
-  tokens_cursor = tokens;
+  atoms_cursor = atoms;
 
-  // Generate all posible tokens for the string. These tokens are substrings up
-  // to MAX_TOKEN bytes length, which are generally a prefix of the strings,
-  // but not necessarily. For hex strings token can be extracted from the middle
-  // of the string. This tokens are added to the Aho-Corasick automaton.
+  // Generate all posible atoms for the string. These atoms are substrings up
+  // to MAX_ATOM bytes length, which are generally a prefix of the strings,
+  // but not necessarily. For hex strings atom can be extracted from the middle
+  // of the string. This atoms are added to the Aho-Corasick automaton.
 
-  _yr_ac_gen_tokens(string, MAX_TOKEN, tokens);
+  _yr_ac_gen_atoms(string, MAX_ATOM, atoms);
 
-  token_length = *((int*) tokens_cursor);
-  tokens_cursor += sizeof(int);
+  atom_length = *((int*) atoms_cursor);
+  atoms_cursor += sizeof(int);
 
-  if (token_length == 0)
+  if (atom_length == 0)
   {
-    *min_token_length = 0;
+    *min_atom_length = 0;
 
-    // No token could be extracted from the string, put the string in the
+    // No atom could be extracted from the string, put the string in the
     // automaton's root state. This is far from ideal, because the string will
     // be tried at every data offset during scanning.
 
@@ -1002,46 +1005,46 @@ int yr_ac_add_string(
   }
   else
   {
-    // For each token create the states in the automaton.
+    // For each atom create the states in the automaton.
 
-    *min_token_length = MAX_TOKEN;
+    *min_atom_length = MAX_ATOM;
 
-    while (token_length != 0)
+    while (atom_length != 0)
     {
-      if (token_length < *min_token_length)
-        *min_token_length = token_length;
+      if (atom_length < *min_atom_length)
+        *min_atom_length = atom_length;
 
       state = automaton->root;
 
-      token_backtrack = *((int*) tokens_cursor);
-      tokens_cursor += sizeof(int);
+      atom_backtrack = *((int*) atoms_cursor);
+      atoms_cursor += sizeof(int);
 
-      for(i = 0; i < token_length; i++)
+      for(i = 0; i < atom_length; i++)
       {
         next_state = yr_ac_next_state(
             state,
-            *tokens_cursor);
+            *atoms_cursor);
 
         if (next_state == NULL)
         {
           next_state = _yr_ac_create_state(
               arena,
               state,
-              *tokens_cursor);
+              *atoms_cursor);
 
           if (next_state == NULL)
           {
-            yr_free(tokens);
+            yr_free(atoms);
             return ERROR_INSUFICIENT_MEMORY;
           }
         }
 
         state = next_state;
-        tokens_cursor++;
+        atoms_cursor++;
       }
 
-      token_length = *((int*) tokens_cursor);
-      tokens_cursor += sizeof(int);
+      atom_length = *((int*) atoms_cursor);
+      atoms_cursor += sizeof(int);
 
       result = yr_arena_allocate_struct(
           arena,
@@ -1053,7 +1056,7 @@ int yr_ac_add_string(
 
       if (result == ERROR_SUCCESS)
       {
-        new_match->backtrack = state->depth + token_backtrack;
+        new_match->backtrack = state->depth + atom_backtrack;
         new_match->string = string;
         new_match->next = state->matches;
         state->matches = new_match;
@@ -1065,7 +1068,7 @@ int yr_ac_add_string(
     }
   }
 
-  yr_free(tokens);
+  yr_free(atoms);
 
   return result;
 }
diff --git a/libyara/exec.c b/libyara/exec.c
index 7e66d12..9ac3b1d 100644
--- a/libyara/exec.c
+++ b/libyara/exec.c
@@ -101,69 +101,56 @@ int yr_execute_code(
         r1 = *(uint64_t*)(ip + 1);
         ip += sizeof(uint64_t);
         push(r1);
-        //printf("PUSH: %p\n", r1);
         break;
 
       case PUSH_A:
         push(rA);
-        //printf("PUSH_A: %p\n", rA);
         break;
 
       case POP_A:
         pop(rA);
-        //printf("POP_A: %p\n", rA);
         break;
 
       case PUSH_B:
         push(rB);
-        //printf("PUSH_B: %p\n", rB);
         break;
 
       case POP_B:
         pop(rB);
-        //printf("POP_B: %p\n", rB);
         break;
 
       case PUSH_C:
         push(rC);
-        //printf("PUSH_C: %p\n", rC);
         break;
 
       case POP_C:
         pop(rC);
-        //printf("POP_C: %p\n", rC);
         break;
 
       case CLEAR_B:
-        //printf("CLEAR_B\n");
         rB = 0;
         break;
 
       case CLEAR_C:
-        //printf("CLEAR_C\n");
         rC = 0;
         break;
 
       case INCR_A:
         pop(r1);
         rA += r1;
-        //printf("INCR_A A:%d\n", rA);
         break;
 
       case INCR_B:
         pop(r1);
         rB += r1;
-        //printf("INCR_B B:%d\n", rB);
         break;
 
       case INCR_C:
         pop(r1);
         rC += r1;
-        //printf("INCR_C C:%d\n", rC);
         break;
 
       case JLE_A_B:
-        //printf("JLE_A_B A:%d  B:%d\n", rA, rB);
         if (rA <= rB)
         {
           ip = *(uint8_t**)(ip + 1);
@@ -192,7 +179,6 @@ int yr_execute_code(
         break;
 
       case PNUNDEF_A_B:
-        //printf("PNUNDEF_A_B  %p\n", rA != UNDEFINED ? rA : rB);
         if (rA != UNDEFINED)
           push(rA);
         else
@@ -203,14 +189,12 @@ int yr_execute_code(
         pop(r2);
         pop(r1);
         push(r1 & r2);
-        //printf("AND %p %p\n", r1, r2);
         break;
 
       case OR:
         pop(r2);
         pop(r1);
         push(r1 | r2);
-        //printf("OR %p %p\n", r1, r2);
         break;
 
       case NOT:
@@ -222,21 +206,18 @@ int yr_execute_code(
         pop(r2);
         pop(r1);
         push(comparison(<, r1, r2));
-        //printf("LT %p %p\n", r1, r2);
         break;
 
       case GT:
         pop(r2);
         pop(r1);
         push(comparison(>, r1, r2));
-        //printf("GT %p %p\n", r1, r2);
         break;
 
       case LE:
         pop(r2);
         pop(r1);
         push(comparison(<=, r1, r2));
-        //printf("LE %p %p\n", r1, r2);
         break;
 
       case GE:
@@ -255,21 +236,18 @@ int yr_execute_code(
         pop(r2);
         pop(r1);
         push(comparison(!=, r1, r2));
-        //printf("NEQ %p %p %p\n", r1, r2, comparison(!=, r1, r2));
         break;
 
       case ADD:
         pop(r2);
         pop(r1);
         push(operation(+, r1, r2));
-        //printf("ADD %p %p %p\n", r1, r2, operation(+, r1, r2));
         break;
 
       case SUB:
         pop(r2);
         pop(r1);
         push(operation(-, r1, r2));
-        //printf("SUB %p %p %p\n", r1, r2, operation(-, r1, r2));
         break;
 
       case MUL:
@@ -317,7 +295,6 @@ int yr_execute_code(
         rule = *(RULE**)(ip + 1);
         ip += sizeof(uint64_t);
         push(rule->flags & RULE_FLAGS_MATCH ? 1 : 0);
-        //printf("RULE_PUSH %s %d\n", rule->identifier, rule->flags | RULE_FLAGS_MATCH ? 1 : 0);
         break;
 
       case RULE_POP:
@@ -326,7 +303,6 @@ int yr_execute_code(
         ip += sizeof(uint64_t);
         if (r1)
           rule->flags |= RULE_FLAGS_MATCH;
-        //printf("RULE_POP %s %d\n", rule->identifier, r1);
         break;
 
       case EXT_INT:
@@ -355,7 +331,6 @@ int yr_execute_code(
         pop(r1);
         string = UINT64_TO_PTR(STRING*, r1);
         push(string->flags & STRING_FLAGS_FOUND ? 1 : 0);
-        //printf("SFOUND %s %d\n", string->identifier, string->flags & STRING_FLAGS_FOUND? 1 : 0);
         break;
 
       case SFOUND_AT:
@@ -457,15 +432,12 @@ int yr_execute_code(
         i = 1;
         found = 0;
 
-        //printf("SOFFSET %s[%d] ", string->identifier, r1);
-
         while (match != NULL)
         {
           if (r1 >= i &&
               r1 <= i + match->last_offset - match->first_offset)
           {
             push(match->first_offset + r1 - i);
-            //printf("%d", match->first_offset + r1 - i);
             found = 1;
           }
 
@@ -476,14 +448,13 @@ int yr_execute_code(
         if (!found)
           push(UNDEFINED);
 
-        //printf("\n");
-
         break;
 
       case OF:
         found = 0;
         count = 0;
         pop(r1);
+
         while (r1 != UNDEFINED)
         {
           string = UINT64_TO_PTR(STRING*, r1);
@@ -492,11 +463,14 @@ int yr_execute_code(
           count++;
           pop(r1);
         }
+
         pop(r2);
+
         if (r2 != UNDEFINED)
           push(found >= r2 ? 1 : 0);
         else
           push(found >= count ? 1 : 0);
+
         break;
 
       case SIZE:
@@ -540,7 +514,8 @@ int yr_execute_code(
       case CONTAINS:
         pop(r2);
         pop(r1);
-        push(strstr(UINT64_TO_PTR(char*, r1), UINT64_TO_PTR(char*, r2)) != NULL);
+        push(strstr(UINT64_TO_PTR(char*, r1),
+                    UINT64_TO_PTR(char*, r2)) != NULL);
         break;
 
       case MATCHES:
diff --git a/libyara/mem.c b/libyara/mem.c
index 3193f0b..48a9aa0 100644
--- a/libyara/mem.c
+++ b/libyara/mem.c
@@ -52,13 +52,9 @@ void yr_free(void* ptr)
 
 char* yr_strdup(const char *s)
 {
-  size_t len;
-  char *r;
-
-  len = strlen(s);
-  r = yr_malloc(len + 1);
+  size_t len = strlen(s);
+  char *r = yr_malloc(len + 1);
   strcpy(r, s);
-
   return r;
 }
 
@@ -68,55 +64,74 @@ char* yr_strdup(const char *s)
 #include <string.h>
 #include <stdio.h>
 
+
+#ifdef DEBUG_HEAP
 static int count;
+#endif
 
 void yr_heap_alloc()
 {
+  #ifdef DEBUG_HEAP
   count = 0;
+  #endif
   return;
 }
 
 
 void yr_heap_free()
 {
+  #ifdef DEBUG_HEAP
   printf("malloc count: %d\n", count);
+  #endif
   return;
 }
 
 
 void* yr_malloc(size_t size)
 {
-  void* result;
+  void* result = malloc(size);
+
+  #ifdef DEBUG_HEAP
   count++;
-  result = malloc(size);
-  //printf("malloc: %p %d\n", result, size);
+  printf("malloc: %p %zd\n", result, size);
+  #endif
+
   return result;
 }
 
 
 void* yr_realloc(void* ptr, size_t size)
 {
-  void* result;
-  result = realloc(ptr, size);
-  //printf("realloc: %p -> %p\n", ptr, result);
+  void* result = realloc(ptr, size);
+
+  #ifdef DEBUG_HEAP
+  printf("realloc: %p -> %p\n", ptr, result);
+  #endif
+
   return result;
 }
 
 
 void yr_free(void *ptr)
 {
+  #ifdef DEBUG_HEAP
   count--;
-  //printf("free: %p\n", ptr);
+  printf("free: %p\n", ptr);
+  #endif
+
   free(ptr);
 }
 
 
 char* yr_strdup(const char *str)
 {
-  void* result;
+  void* result = strdup(str);
+
+  #ifdef DEBUG_HEAP
   count++;
-  result = strdup(str);
-  //printf("strdup: %p %d %s\n", result, strlen(str) + 1, str);
+  printf("strdup: %p %zd %s\n", result, strlen(str) + 1, str);
+  #endif
+
   return result;
 }
 

-- 
Alioth's /usr/local/bin/git-commit-notice on /srv/git.debian.org/git/forensics/yara.git