Module `refinery.units.obfuscation.vba.dummies`

Expand source code Browse git

from __future__ import annotations

import collections
import re

from refinery.lib.patterns import formats
from refinery.units.obfuscation import Deobfuscator


class deob_vba_dummy_variables(Deobfuscator):
    """
    Removes lines that assign a value to a VBA variable when no other line of the
    script appears to read that variable.
    """

    def deobfuscate(self, data):
        """
        Return `data` without the assignment lines of apparently unused variables.

        The input is split into lines; the result is always joined with a single
        line feed, regardless of the line endings that were used in the input.
        """
        lines = data.splitlines(keepends=False)
        # maps a variable name to the indices of all lines that assign to it
        names = collections.defaultdict(list)

        def might_be_used_in(name, line):
            """
            Check whether `line` contains an occurrence of `name` that is not merely
            an assignment target, a declaration, or part of a comment. The given
            line is expected to have its string literals blanked out already.
            """
            # Every occurrence is judged on its own: a line such as "y = x + x"
            # contains the name twice and must still count as a usage.
            for hit in re.finditer(RF'\b{name}\b', line):
                L = line[:hit.start()].strip().lower()
                R = line[hit.end():].strip().lower()
                # Match "rem" as a whole word only, so that identifiers which merely
                # begin with these letters are not mistaken for a comment.
                if L.startswith("'") or re.match(r'rem\b', L):
                    return False
                if R.startswith('=') and 'if' not in L:
                    # the name is being assigned to, not read
                    continue
                if L.startswith('dim'):
                    # the name is being declared, not read
                    continue
                return True
            return False

        pattern = re.compile(
            R'(?i)^\s{0,8}(?:const\s{1,8})?(\w+)\s{1,8}=\s{1,8}.*$'
        )

        for k, line in enumerate(lines):
            match = pattern.match(line)
            if match is None:
                continue
            if re.search(r'\w+\(', line):
                # might be a function call
                continue
            names[match[1]].append(k)

        if names:
            for k, line in enumerate(lines):
                # avoid finding the name within a string literal
                line = '""'.join(re.split(str(formats.ps1str), line))
                # A variable's own assignment lines never count as a usage; this
                # keeps self-referential dummies like "x = x + 1" removable.
                used = [
                    name for name, rows in names.items()
                    if k not in rows and might_be_used_in(name, line)
                ]
                for name in used:
                    del names[name]
                if not names:
                    break

        # whatever is left in the map was never read: drop all of its assignments
        removed = {k for rows in names.values() for k in rows}
        return '\n'.join(line for k, line in enumerate(lines) if k not in removed)

Classes

class deob_vba_dummy_variables

Expand source code Browse git

class deob_vba_dummy_variables(Deobfuscator):
    """
    Removes lines that assign a value to a VBA variable when no other line of the
    script appears to read that variable.
    """

    def deobfuscate(self, data):
        """
        Return `data` without the assignment lines of apparently unused variables.

        The input is split into lines; the result is always joined with a single
        line feed, regardless of the line endings that were used in the input.
        """
        lines = data.splitlines(keepends=False)
        # maps a variable name to the indices of all lines that assign to it
        names = collections.defaultdict(list)

        def might_be_used_in(name, line):
            """
            Check whether `line` contains an occurrence of `name` that is not merely
            an assignment target, a declaration, or part of a comment. The given
            line is expected to have its string literals blanked out already.
            """
            # Every occurrence is judged on its own: a line such as "y = x + x"
            # contains the name twice and must still count as a usage.
            for hit in re.finditer(RF'\b{name}\b', line):
                L = line[:hit.start()].strip().lower()
                R = line[hit.end():].strip().lower()
                # Match "rem" as a whole word only, so that identifiers which merely
                # begin with these letters are not mistaken for a comment.
                if L.startswith("'") or re.match(r'rem\b', L):
                    return False
                if R.startswith('=') and 'if' not in L:
                    # the name is being assigned to, not read
                    continue
                if L.startswith('dim'):
                    # the name is being declared, not read
                    continue
                return True
            return False

        pattern = re.compile(
            R'(?i)^\s{0,8}(?:const\s{1,8})?(\w+)\s{1,8}=\s{1,8}.*$'
        )

        for k, line in enumerate(lines):
            match = pattern.match(line)
            if match is None:
                continue
            if re.search(r'\w+\(', line):
                # might be a function call
                continue
            names[match[1]].append(k)

        if names:
            for k, line in enumerate(lines):
                # avoid finding the name within a string literal
                line = '""'.join(re.split(str(formats.ps1str), line))
                # A variable's own assignment lines never count as a usage; this
                # keeps self-referential dummies like "x = x + 1" removable.
                used = [
                    name for name, rows in names.items()
                    if k not in rows and might_be_used_in(name, line)
                ]
                for name in used:
                    del names[name]
                if not names:
                    break

        # whatever is left in the map was never read: drop all of its assignments
        removed = {k for rows in names.values() for k in rows}
        return '\n'.join(line for k, line in enumerate(lines) if k not in removed)

Ancestors

Subclasses

deob_vba_dummy_variables

Class variables

var reverse: The type of the None singleton.

Methods

def deobfuscate(self, data)

Expand source code Browse git

def deobfuscate(self, data):
    """
    Return `data` without the lines that assign to apparently unused variables.

    A line is recorded as an assignment when it has the shape `name = value`,
    optionally preceded by `Const`, and contains nothing that looks like a call.
    All recorded assignments of a name are removed when no other line appears to
    read that name. The input is split into lines; the result is always joined
    with a single line feed, regardless of the line endings used in the input.
    """
    lines = data.splitlines(keepends=False)
    # maps a variable name to the indices of all lines that assign to it
    names = collections.defaultdict(list)

    def might_be_used_in(name, line):
        """
        Check whether `line` contains an occurrence of `name` that is not merely
        an assignment target, a declaration, or part of a comment. The given
        line is expected to have its string literals blanked out already.
        """
        # Every occurrence is judged on its own: a line such as "y = x + x"
        # contains the name twice and must still count as a usage.
        for hit in re.finditer(RF'\b{name}\b', line):
            L = line[:hit.start()].strip().lower()
            R = line[hit.end():].strip().lower()
            # Match "rem" as a whole word only, so that identifiers which merely
            # begin with these letters are not mistaken for a comment.
            if L.startswith("'") or re.match(r'rem\b', L):
                return False
            if R.startswith('=') and 'if' not in L:
                # the name is being assigned to, not read
                continue
            if L.startswith('dim'):
                # the name is being declared, not read
                continue
            return True
        return False

    pattern = re.compile(
        R'(?i)^\s{0,8}(?:const\s{1,8})?(\w+)\s{1,8}=\s{1,8}.*$'
    )

    for k, line in enumerate(lines):
        match = pattern.match(line)
        if match is None:
            continue
        if re.search(r'\w+\(', line):
            # might be a function call
            continue
        names[match[1]].append(k)

    if names:
        for k, line in enumerate(lines):
            # avoid finding the name within a string literal
            line = '""'.join(re.split(str(formats.ps1str), line))
            # A variable's own assignment lines never count as a usage; this
            # keeps self-referential dummies like "x = x + 1" removable.
            used = [
                name for name, rows in names.items()
                if k not in rows and might_be_used_in(name, line)
            ]
            for name in used:
                del names[name]
            if not names:
                break

    # whatever is left in the map was never read: drop all of its assignments
    removed = {k for rows in names.values() for k in rows}
    return '\n'.join(line for k, line in enumerate(lines) if k not in removed)

Inherited members

Deobfuscator:
- FilterEverything
- Requires
- act
- assemble
- codec
- console
- filter
- finish
- handles
- is_quiet
- is_reversible
- isatty
- labelled
- leniency
- log_always
- log_debug
- log_detach
- log_fail
- log_info
- log_level
- log_warn
- logger
- name
- nozzle
- optional_dependencies
- read
- read1
- required_dependencies
- reset
- run
- source
- superinit
UnitBase:
- process