Mirror of https://github.com/RRZE-HPC/OSACA.git (synced 2026-01-05 10:40:06 +01:00)
845 lines · 31 KiB · Python · Executable File
#!/usr/bin/python

import argparse
import sys
import os
import io
import re
import subprocess
from datetime import datetime

import pandas as pd
import numpy as np

from param import Register, MemAddr, Parameter
from eu_sched import Scheduler
from testcase import Testcase


class Osaca(object):
    arch = None
    filepath = None
    srcCode = None
    df = None
    instr_forms = None
    # Variables for checking lines
    numSeps = 0
    indentChar = ''
    sem = 0
    marker = r'//STARTLOOP'

    # Variables for creating output
    longestInstr = 30
    # Constants
    ASM_LINE = re.compile(r'\s[0-9a-f]+[:]')
    # Matches every variation of the IACA start marker
    IACA_SM = re.compile(r'\s*movl[ \t]+\$111[ \t]*,[ \t]*%ebx[ \t]*\n\s*\.byte[ \t]+100[ \t]*'
                         + r'((,[ \t]*103[ \t]*((,[ \t]*144)|(\n\s*\.byte[ \t]+144)))|(\n\s*\.byte'
                         + r'[ \t]+103[ \t]*((,[ \t]*144)|(\n\s*\.byte[ \t]+144))))')
    # Matches every variation of the IACA end marker
    IACA_EM = re.compile(r'\s*movl[ \t]+\$222[ \t]*,[ \t]*%ebx[ \t]*\n\s*\.byte[ \t]+100[ \t]*'
                         + r'((,[ \t]*103[ \t]*((,[ \t]*144)|(\n\s*\.byte[ \t]+144)))|(\n\s*\.byte'
                         + r'[ \t]+103[ \t]*((,[ \t]*144)|(\n\s*\.byte[ \t]+144))))')
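    # Added illustration (not part of the upstream sources): the IACA byte markers matched by
    # the two regexes above typically appear in compiler-generated AT&T assembly as
    #     movl $111, %ebx        # start marker ($222 for the end marker)
    #     .byte 100, 103, 144
    # in one of the comma/newline variations the patterns allow for.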

    def __init__(self, _arch, _filepath):
        self.arch = _arch
        self.filepath = _filepath
        self.instr_forms = []

    # -----------------main functions depending on arguments--------------------
    def include_ibench(self):
        """
        Reads ibench output and includes it in the architecture specific csv
        file.
        """
        # Check args and exit program if something's wrong
        if(not self.check_arch()):
            print('Invalid microarchitecture.')
            sys.exit()
        if(not self.check_file()):
            print('Invalid file path or file format.')
            sys.exit()
        # Check for database for the chosen architecture
        self.df = self.read_csv()
        # Create sequence of numbers and their reciprocals to validate the measurements
        cyc_list, reci_list = self.create_sequences()
        print('Everything seems fine! Let\'s start!')
        new_data = []
        added_vals = 0
        for line in self.srcCode:
            if('Using frequency' in line or len(line) == 0):
                continue
            clmn = 'LT'
            instr = line.split()[0][:-1]
            if('TP' in line):
                # We found a command with a throughput value. Get instruction and the number of
                # clock cycles and remove the '-TP' suffix.
                clmn = 'TP'
                instr = instr[:-3]
            # Otherwise it is a latency value. Nothing to do.
            clk_cyc = line.split()[1]
            clk_cyc_tmp = clk_cyc
            clk_cyc = self.validate_val(clk_cyc, instr, True if (clmn == 'TP') else False,
                                        cyc_list, reci_list)
            txt_output = True if (clk_cyc_tmp == clk_cyc) else False
            val = -2
            new = False
            try:
                entry = self.df.loc[lambda df, inst=instr: df.instr == inst, clmn]
                val = entry.values[0]
            except IndexError:
                # Instruction not in database yet --> add it
                new = True
                # First check if LT or TP value has already been added before
                for i, item in enumerate(new_data):
                    if(instr in item):
                        if(clmn == 'TP'):
                            new_data[i][1] = clk_cyc
                        elif(clmn == 'LT'):
                            new_data[i][2] = clk_cyc
                        new = False
                        break
                if(new and clmn == 'TP'):
                    new_data.append([instr, clk_cyc, '-1', ((-1,),)])
                elif(new and clmn == 'LT'):
                    new_data.append([instr, '-1', clk_cyc, ((-1,),)])
                new = True
                added_vals += 1
            # If val is -1 (= not filled with a valid value) add it immediately
            if(val == -1):
                self.df.set_value(entry.index[0], clmn, clk_cyc)
                added_vals += 1
                continue
            if(not new and abs((val/np.float64(clk_cyc))-1) > 0.05):
                print('Different measurement for {} ({}): {}(old) vs. '.format(instr, clmn, val)
                      + '{}(new)\nPlease check for correctness '.format(clk_cyc)
                      + '(no changes were made).')
                txt_output = True
            if(txt_output):
                print()
                txt_output = False
        # Now merge the DataFrames and write new csv file
        self.df = self.df.append(pd.DataFrame(new_data, columns=['instr', 'TP', 'LT', 'ports']),
                                 ignore_index=True)
        csv = self.df.to_csv(index=False)
        self.write_csv(csv)
        print('ibench output {} '.format(self.filepath.split('/')[-1])
              + 'successfully included in the database.')
        print('{} values were added.'.format(added_vals))

    def inspect_binary(self):
        """
        Main function of OSACA. Inspect binary file and create analysis.
        """
        # Check args and exit program if something's wrong
        if(not self.check_arch()):
            print('Invalid microarchitecture.')
            sys.exit()
        if(not self.check_elffile()):
            print('Invalid file path or file format.')
            sys.exit()
        # Finally check for database for the chosen architecture
        self.read_csv()

        print('Everything seems fine! Let\'s start checking!')
        for i, line in enumerate(self.srcCode):
            if(i == 0):
                self.check_line(line, True)
            else:
                self.check_line(line)
        output = self.create_output()
        print(output)

    def inspect_with_iaca(self):
        """
        Main function of OSACA with IACA markers instead of the OSACA marker.
        Inspect binary file and create analysis.
        """
        # Check args and exit program if something's wrong
        if(not self.check_arch()):
            print('Invalid microarchitecture.')
            sys.exit()
        # Check if input file is a binary or assembly file
        try:
            binary_file = True
            if(not self.check_elffile()):
                print('Invalid file path or file format.')
                sys.exit()
        except (TypeError, IndexError):
            binary_file = False
            if(not self.check_file(True)):
                print('Invalid file path or file format.')
                sys.exit()
        # Finally check for database for the chosen architecture
        self.read_csv()

        print('Everything seems fine! Let\'s start checking!')
        if(binary_file):
            self.iaca_bin()
        else:
            self.iaca_asm()
        output = self.create_output()
        print(output)

    # --------------------------------------------------------------------------

    def check_arch(self):
        """
        Check if the architecture is valid.

        Returns
        -------
        bool
            True if arch is supported
            False if arch is not supported
        """
        arch_list = ['SNB', 'IVB', 'HSW', 'BDW', 'SKL']
        if(self.arch in arch_list):
            return True
        else:
            return False

    def check_elffile(self):
        """
        Check if the given filepath exists, if the format is the needed elf64
        and store file data in attribute srcCode.

        Returns
        -------
        bool
            True if file is expected elf64 file
            False if file does not exist or is not an elf64 file
        """
        if(os.path.isfile(self.filepath)):
            self.store_src_code_elf()
            if('file format elf64' in self.srcCode[1]):
                return True
        return False

    def check_file(self, iaca_flag=False):
        """
        Check if the given filepath exists and store file data in attribute
        srcCode.

        Parameters
        ----------
        iaca_flag : bool
            store file data as a string in attribute srcCode if True,
            store it as a list of strings (lines) if False (default False)

        Returns
        -------
        bool
            True if file exists
            False if file does not exist
        """
        if(os.path.isfile(self.filepath)):
            self.store_src_code(iaca_flag)
            return True
        return False

    def store_src_code_elf(self):
        """
        Load binary file compiled with '-g' in class attribute srcCode and
        separate it by line.
        """
        self.srcCode = (subprocess.run(['objdump', '--source', self.filepath],
                                       stdout=subprocess.PIPE).stdout.decode('utf-8').split('\n'))

    def store_src_code(self, iaca_flag=False):
        """
        Load arbitrary file in class attribute srcCode.

        Parameters
        ----------
        iaca_flag : bool
            store file data as a string in attribute srcCode if True,
            store it as a list of strings (lines) if False (default False)
        """
        try:
            f = open(self.filepath, 'r')
        except IOError:
            print('IOError: file \'{}\' not found'.format(self.filepath))
            # Without a readable input file there is nothing to analyze
            sys.exit()
        self.srcCode = ''
        for line in f:
            self.srcCode += line
        f.close()
        if(iaca_flag):
            return
        self.srcCode = self.srcCode.split('\n')

    def read_csv(self):
        """
        Reads architecture dependent CSV from data directory.

        Returns
        -------
        DataFrame
            CSV as DataFrame object
        """
        curr_dir = '/'.join(os.path.realpath(__file__).split('/')[:-1])
        df = pd.read_csv(curr_dir+'/data/'+self.arch.lower()+'_data.csv')
        return df
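    # Added note: judging from include_ibench() and create_tp_list(), the CSV read here is
    # expected to provide the columns 'instr', 'TP', 'LT' and 'ports', with 'instr' keys of
    # the form '<mnemonic>-<operand types>' (e.g. something like 'add-r64_r64'); the concrete
    # example key is only an illustrative guess.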

    def write_csv(self, csv):
        """
        Writes architecture dependent CSV into data directory.

        Parameters
        ----------
        csv : str
            CSV data as string
        """
        try:
            f = open('data/'+self.arch.lower()+'_data.csv', 'w')
        except IOError:
            print('IOError: file \'{}\' not found in ./data'.format(self.arch.lower()+'_data.csv'))
            # Without a writable file the data cannot be stored, so stop here
            sys.exit()
        f.write(csv)
        f.close()

    def create_sequences(self, end=101):
        """
        Creates a list of integers from 1 to end-1 and a list of their reciprocals.

        Parameters
        ----------
        end : int
            End value (exclusive) for the list of integers (default 101)

        Returns
        -------
        [int]
            cyc_list of integers
        [float]
            reci_list of floats
        """
        cyc_list = []
        reci_list = []
        for i in range(1, end):
            cyc_list.append(i)
            reci_list.append(1/i)
        return cyc_list, reci_list

    def validate_val(self, clk_cyc, instr, is_tp, cyc_list, reci_list):
        """
        Validate given clock cycle clk_cyc and return rounded value in case of
        success.

        A successful validation means the clock cycle clk_cyc is at most 5% higher
        or lower than an integer value from cyc_list or - if clk_cyc is a throughput
        value - at most 5% higher or lower than a reciprocal from the reci_list.

        Parameters
        ----------
        clk_cyc : float
            Clock cycle to validate
        instr : str
            Instruction for warning output
        is_tp : bool
            True if a throughput value is to be checked, False for a latency value
        cyc_list : [int]
            Cycle list for validating
        reci_list : [float]
            Reciprocal cycle list for validating

        Returns
        -------
        float
            Clock cycle, either rounded to an integer or its reciprocal or the
            given clk_cyc parameter
        """
        clmn = 'LT'
        if(is_tp):
            clmn = 'TP'
        for i in range(0, len(cyc_list)):
            if(cyc_list[i]*1.05 > float(clk_cyc) and cyc_list[i]*0.95 < float(clk_cyc)):
                # Value is probably correct, so round it to the estimated value
                return cyc_list[i]
            # Check reciprocal only if it is a throughput value
            elif(is_tp and reci_list[i]*1.05 > float(clk_cyc)
                 and reci_list[i]*0.95 < float(clk_cyc)):
                # Value is probably correct, so round it to the estimated value
                return reci_list[i]
        # No value close to an integer or its reciprocal found, we assume the
        # measurement is incorrect
        print('Your measurement for {} ({}) is probably wrong. '.format(instr, clmn)
              + 'Please inspect your benchmark!')
        print('The program will continue with the given value')
        return clk_cyc
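    # Added worked example: with the default lists from create_sequences(), a measured
    # throughput of 0.52 lies within 5% of the reciprocal 1/2 and is returned as 0.5, a
    # measured latency of 3.02 is rounded to 3, and a value such as 0.7 matches neither
    # list, so it is returned unchanged after the warning above.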

    def check_line(self, line, first_appearance=False):
        """
        Inspect line of source code and process it if inside the marked snippet.

        Parameters
        ----------
        line : str
            Line of source code
        first_appearance : bool
            Necessary for setting the indentation character (default False)
        """
        # Check if marker is in line
        if(self.marker in line):
            # First, check if the high level code is indented with whitespaces or tabs
            if(first_appearance):
                self.indentChar = self.get_indent_chars(line)
            # Now count the number of whitespaces
            self.numSeps = (re.split(self.marker, line)[0]).count(self.indentChar)
            self.sem = 2
        elif(self.sem > 0):
            # We're in the marked code snippet
            # Check if the line is ASM code and - if not - check if we're still in the loop
            match = re.search(self.ASM_LINE, line)
            if(match):
                # Further analysis of instructions
                # Check if there are comments in line
                if(r'//' in line):
                    return
                self.check_instr(''.join(re.split(r'\t', line)[-1:]))
            elif((re.split(r'\S', line)[0]).count(self.indentChar) <= self.numSeps):
                # Not in the loop anymore - or not yet. We decrement the semaphore
                self.sem = self.sem-1
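    # Added usage sketch (assumed workflow, not taken from this file): the '//STARTLOOP'
    # marker is written into the high-level source at the same indentation as the loop it
    # marks, e.g.
    #     //STARTLOOP
    #     for(int i = 0; i < N; i++)
    #         a[i] = b[i] + s * c[i];
    # After compiling with '-g', check_line() uses the recorded marker indentation to decide
    # when the objdump output has left the loop body again.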

    def get_indent_chars(self, line):
        """
        Check if indentation characters are either tabulators or whitespaces.

        Parameters
        ----------
        line : str
            Line with the start marker in it

        Returns
        -------
        str
            Indentation character as string
        """
        num_spaces = (re.split(self.marker, line)[0]).count(' ')
        num_tabs = (re.split(self.marker, line)[0]).count('\t')
        if(num_spaces != 0 and num_tabs == 0):
            return ' '
        elif(num_spaces == 0 and num_tabs != 0):
            return '\t'
        else:
            err_msg = 'Indentation of code is only supported for whitespaces and tabs.'
            raise NotImplementedError(err_msg)

    def iaca_bin(self):
        """
        Extract instruction forms out of binary file using IACA markers.
        """
        self.marker = r'fs addr32 nop'
        for line in self.srcCode:
            # Check if marker is in line
            if(self.marker in line):
                self.sem += 1
            elif(self.sem == 1):
                # We're in the marked code snippet
                # Check if the line is ASM code
                match = re.search(self.ASM_LINE, line)
                if(match):
                    # Further analysis of instructions
                    # Check if there are comments in line
                    if(r'//' in line):
                        continue
                    # Do the same instruction check as for the OSACA marker line check
                    self.check_instr(''.join(re.split(r'\t', line)[-1:]))
            elif(self.sem == 2):
                # Not in the loop anymore. Since these are IACA markers we can stop here,
                # after removing the last line, which belongs to the end marker
                del self.instr_forms[-1:]
                return

    def iaca_asm(self):
        """
        Extract instruction forms out of assembly file using IACA markers.
        """
        # Extract the code snippet surrounded by the IACA markers
        code = self.srcCode
        # Search for the start marker
        match = re.match(self.IACA_SM, code)
        while(not match):
            code = code.split('\n', 1)[1]
            match = re.match(self.IACA_SM, code)
        # Search for the end marker
        code = (code.split('144', 1)[1]).split('\n', 1)[1]
        res = ''
        match = re.match(self.IACA_EM, code)
        while(not match):
            res += code.split('\n', 1)[0]+'\n'
            code = code.split('\n', 1)[1]
            match = re.match(self.IACA_EM, code)
        # Split the result by line and go on as with the OSACA markers
        res = res.split('\n')
        for line in res:
            line = line.split('#')[0]
            line = line.lstrip()
            if(len(line) == 0 or '//' in line or line.startswith('..')):
                continue
            self.check_instr(line)

    def check_instr(self, instr):
        """
        Inspect instruction for its parameters and add it to the instruction forms
        pool instr_forms.

        Parameters
        ----------
        instr : str
            Instruction as string
        """
        # Check for strange clang padding bytes
        while(instr.startswith('data32')):
            instr = instr[7:]
        # Separate mnemonic and operands
        mnemonic = instr.split()[0]
        params = ''.join(instr.split()[1:])
        # Check if line is not only a byte
        empty_byte = re.compile(r'[0-9a-f]{2}')
        if(re.match(empty_byte, mnemonic) and len(mnemonic) == 2):
            return
        # Check if there's one or more operands and store all in a list
        param_list = self.flatten(self.separate_params(params))
        param_list_types = list(param_list)
        # Check operands and separate them by IMMEDIATE (IMD), REGISTER (REG),
        # MEMORY (MEM) or LABEL (LBL)
        for i in range(len(param_list)):
            op = param_list[i]
            if(len(op) <= 0):
                op = Parameter('NONE')
            elif(op[0] == '$'):
                op = Parameter('IMD')
            elif(op[0] == '%' and '(' not in op):
                j = len(op)
                opmask = False
                if('{' in op):
                    j = op.index('{')
                    opmask = True
                op = Register(op[1:j], opmask)
            elif('<' in op or op.startswith('.')):
                op = Parameter('LBL')
            else:
                op = MemAddr(op)
            param_list[i] = str(op)
            param_list_types[i] = op
        # Add to list
        if(len(instr) > self.longestInstr):
            self.longestInstr = len(instr)
        instr_form = [mnemonic]+list(reversed(param_list_types))+[instr]
        self.instr_forms.append(instr_form)
        # If flag is set, create testcase for the instruction form.
        # Do this in reversed param list order, due to the fact it's Intel syntax.
        # Only create a benchmark if no label (LBL) is part of the operands
        if('LBL' in param_list or '' in param_list):
            return
        tc = Testcase(mnemonic, list(reversed(param_list_types)), '64')
        # Only write a testcase if it does not already exist
        writeTP, writeLT = tc.is_in_dir()
        tc.write_testcase(not writeTP, not writeLT)
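    # Added example: for an AT&T-syntax line such as 'vaddpd %ymm0, %ymm1, %ymm2' the
    # mnemonic becomes 'vaddpd', every operand is classified as a Register, and the stored
    # instruction form is [mnemonic, op3, op2, op1, original line], i.e. with the operand
    # order reversed as noted above for the Intel-syntax testcases.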

    def separate_params(self, params):
        """
        Delete comments, separate parameters and return them as a nested list.

        Parameters
        ----------
        params : str
            Operand part of the line after the mnemonic

        Returns
        -------
        [[...[str]]]
            Nested list of strings. The number of nesting levels depends on the
            number of parameters given.
        """
        param_list = [params]
        if(',' in params):
            if(')' in params):
                if(params.index(')') < len(params)-1 and params[params.index(')')+1] == ','):
                    i = params.index(')')+1
                elif(params.index('(') < params.index(',')):
                    return param_list
                else:
                    i = params.index(',')
            else:
                i = params.index(',')
            param_list = [params[:i], self.separate_params(params[i+1:])]
        elif('#' in params):
            i = params.index('#')
            param_list = [params[:i]]
        return param_list
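    # Added worked example: separate_params('(%rax,%rbx,8),%xmm0') splits at the comma that
    # follows the closing parenthesis and returns ['(%rax,%rbx,8)', ['%xmm0']]; flatten()
    # below turns that nested result into ['(%rax,%rbx,8)', '%xmm0'] for check_instr().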

    def flatten(self, l):
        """
        Flatten a nested list of strings.

        Parameters
        ----------
        l : [[...[str]]]
            Nested list of strings

        Returns
        -------
        [str]
            List of strings
        """
        if l == []:
            return l
        if(isinstance(l[0], list)):
            return self.flatten(l[0]) + self.flatten(l[1:])
        return l[:1] + self.flatten(l[1:])

    def create_output(self, tp_list=False, pr_sched=True):
        """
        Creates output of the analyzed file including a time stamp.

        Parameters
        ----------
        tp_list : bool
            Boolean for indicating the need for the throughput list as output
            (default False)
        pr_sched : bool
            Boolean for indicating the need for predicting a scheduling
            (default True)

        Returns
        -------
        str
            OSACA output
        """
        # Check the output alignment depending on the longest instruction
        if(self.longestInstr > 70):
            self.longestInstr = 70
        horiz_line = self.create_horiz_sep()
        # Write general information about the benchmark
        output = ('--' + horiz_line + '\n'
                  + '| Analysis of file:\t' + os.path.abspath(self.filepath) + '\n'
                  + '| Architecture:\t\t' + self.arch + '\n'
                  + '| Timestamp:\t\t' + datetime.now().strftime('%Y-%m-%d %H:%M:%S') + '\n')
        if(tp_list):
            output += self.create_tp_list(horiz_line)
        if(pr_sched):
            output += '\n\n'
            sched = Scheduler(self.arch, self.instr_forms)
            sched_output, port_binding = sched.schedule()
            binding = sched.get_port_binding(port_binding)
            output += sched.get_report_info() + '\n' + binding + '\n\n' + sched_output
            block_tp = round(max(port_binding), 2)
            output += 'Total estimated throughput: ' + str(block_tp)
        return output

    def create_horiz_sep(self):
        """
        Calculate and return the horizontal separator line.

        Returns
        -------
        str
            Horizontal separator line
        """
        return '-'*(self.longestInstr+8)

    def create_tp_list(self, horiz_line):
        """
        Create list of instruction forms with the proper throughput value.

        Parameters
        ----------
        horiz_line : str
            Calculated horizontal line for nice alignment

        Returns
        -------
        str
            Throughput list output for printing
        """
        warning = False
        ws = ' '*(len(horiz_line)-23)

        output = ('\n| INSTRUCTION' + ws + 'CLOCK CYCLES\n'
                  + '| ' + horiz_line + '\n|\n')
        # Suppress pandas' warning about regex-like patterns in str.contains()
        import warnings
        warnings.filterwarnings("ignore", 'This pattern has match groups')
        # Check for the throughput data in CSV
        for elem in self.instr_forms:
            op_ext = []
            for i in range(1, len(elem)-1):
                optmp = ''
                if(isinstance(elem[i], Register) and elem[i].reg_type == 'GPR'):
                    optmp = 'r'+str(elem[i].size)
                elif(isinstance(elem[i], MemAddr)):
                    optmp = 'mem'
                else:
                    optmp = str(elem[i]).lower()
                op_ext.append(optmp)
            operands = '_'.join(op_ext)
            # Now look up the value in the dataframe
            # Check if there is a stored throughput value in database
            series = self.df['instr'].str.contains(elem[0] + '-' + operands)
            if(True in series.values):
                # It's a match!
                not_found = False
                try:
                    tp = self.df[self.df.instr == elem[0] + '-' + operands].TP.values[0]
                except IndexError:
                    # Something went wrong
                    print('Error while fetching data from database')
                    continue
            # Did not find the exact instruction form.
            # Try to find the instruction form for register operands only
            else:
                op_ext_regs = []
                for operand in op_ext:
                    try:
                        # Create Register only to see if it is one
                        Register(operand)
                        op_ext_regs.append(True)
                    except KeyError:
                        op_ext_regs.append(False)
                if(True not in op_ext_regs):
                    # No register in whole instr form. How can I find out what regsize we need?
                    print('Feature not included yet: ', end='')
                    print(elem[0]+' for '+operands)
                    tp = 0
                    not_found = True
                    warning = True
                    num_whitespaces = self.longestInstr-len(elem[-1])
                    ws = ' ' * num_whitespaces + '| '
                    n_f = ' ' * (5 - len(str(tp))) + '*'
                    data = '| ' + elem[-1] + ws + str(tp) + n_f + '\n'
                    output += data
                    continue
                if(op_ext_regs[0] is False):
                    # Instruction stores result in memory. Check for storing in register instead.
                    if(len(op_ext) > 1):
                        if(op_ext_regs[1] is True):
                            op_ext[0] = op_ext[1]
                        elif(len(op_ext) > 2):
                            if(op_ext_regs[2] is True):
                                op_ext[0] = op_ext[2]
                if(len(op_ext_regs) == 2 and op_ext_regs[1] is False):
                    # Instruction loads value from memory and has only two operands. Check for
                    # loading from register instead
                    if(op_ext_regs[0] is True):
                        op_ext[1] = op_ext[0]
                if(len(op_ext_regs) == 3 and op_ext_regs[2] is False):
                    # Instruction loads value from memory and has three operands. Check for loading
                    # from register instead
                    op_ext[2] = op_ext[0]
                operands = '_'.join(op_ext)
                # Check for register equivalent instruction
                series = self.df['instr'].str.contains(elem[0]+'-'+operands)
                if(True in series.values):
                    # It's a match!
                    not_found = False
                    try:
                        tp = self.df[self.df.instr == elem[0]+'-'+operands].TP.values[0]
                    except IndexError:
                        # Something went wrong
                        print('Error while fetching data from database')
                        continue
                # Did not find the register instruction form. Set warning and go on with
                # throughput 0
                else:
                    tp = 0
                    not_found = True
                    warning = True
            # Check the alignment again
            num_whitespaces = self.longestInstr - len(elem[-1])
            ws = ' ' * num_whitespaces + '| '
            n_f = ''
            if(not_found):
                n_f = ' ' * (5 - len(str(tp))) + '*'
            data = '| ' + elem[-1] + ws + '{:3.2f}'.format(tp) + n_f + '\n'
            output += data
        # Finally end the list of throughput values
        num_whitespaces = self.longestInstr - 27
        ws = ' ' + ' ' * num_whitespaces
        output += '| ' + horiz_line + '\n'
        if(warning):
            output += ('\n\n* There was no throughput value found '
                       'for the specific instruction form.'
                       '\n Please create a testcase via the create_testcase-method '
                       'or add a value manually.')
        return output


# ------------------------------------------------------------------------------
# Stolen from pip
def __read(*names, **kwargs):
    with io.open(
            os.path.join(os.path.dirname(__file__), *names),
            encoding=kwargs.get("encoding", "utf8")
    ) as fp:
        return fp.read()


# Stolen from pip
def __find_version(*file_paths):
    version_file = __read(*file_paths)
    version_match = re.search(r"^__version__ = ['\"]([^'\"]*)['\"]", version_file, re.M)
    if version_match:
        return version_match.group(1)
    raise RuntimeError('Unable to find version string.')


# ------------Main method--------------
def main():
    # Parse args
    parser = argparse.ArgumentParser(description='Analyzes a marked innermost loop snippet '
                                     + 'for a given architecture type and prints out the '
                                     + 'estimated average throughput.')
    parser.add_argument('-V', '--version', action='version', version='%(prog)s '
                        + __find_version('__init__.py'))
    parser.add_argument('--arch', dest='arch', type=str, help='define architecture '
                        + '(SNB, IVB, HSW, BDW, SKL)')
    parser.add_argument('filepath', type=str, help='path to object (Binary, ASM, CSV)')
    group = parser.add_mutually_exclusive_group(required=False)
    group.add_argument('-i', '--include-ibench', dest='incl', action='store_true',
                       help='includes the given values in form of the output of ibench in '
                       + 'the database')
    group.add_argument('--iaca', dest='iaca', action='store_true',
                       help='search for IACA markers instead of the OSACA marker')
    group.add_argument('-m', '--insert-marker', dest='insert_marker', action='store_true',
                       help='try to find blocks probably corresponding to loops in assembly '
                       + 'and insert IACA marker')

    # Store args in global variables
    inp = parser.parse_args()
    if(inp.arch is None and not inp.insert_marker):
        raise ValueError('Please specify an architecture')
    if(inp.arch is not None):
        arch = inp.arch.upper()
    filepath = inp.filepath
    incl_ibench = inp.incl
    iaca_flag = inp.iaca
    insert_m = inp.insert_marker

    # Create Osaca object
    if(inp.arch is not None):
        osaca = Osaca(arch, filepath)

    if(incl_ibench):
        osaca.include_ibench()
    elif(iaca_flag):
        osaca.inspect_with_iaca()
    elif(insert_m):
        try:
            from kerncraft import iaca
        except ImportError:
            print('ImportError: Module kerncraft not installed. Use '
                  + '\'pip install --user kerncraft\' for installation.\nFor more information see '
                  + 'https://github.com/RRZE-HPC/kerncraft')
            sys.exit()
        iaca.iaca_instrumentation(input_file=filepath, output_file=filepath,
                                  block_selection='manual', pointer_increment=1)
    else:
        osaca.inspect_binary()


# ------------Main method--------------
if __name__ == '__main__':
    main()
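
# Added usage examples (file names are placeholders; the flags are the ones defined by the
# argument parser above):
#     ./osaca.py --arch IVB ./kernel          # analyze a binary containing the OSACA marker
#     ./osaca.py --arch SKL --iaca kernel.s   # analyze a file with IACA markers
#     ./osaca.py --arch HSW -i ibench.out     # include ibench measurements in the database
#     ./osaca.py -m kernel.s                  # insert IACA markers via kerncraft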