src/arch/x86/isa/specialize.isa - public/gem5 - Git at Google

 // -*- mode:c++ -*-

 // Copyright (c) 2007 The Hewlett-Packard Development Company
 // All rights reserved.
 //
 // The license below extends only to copyright in the software and shall
 // not be construed as granting a license to any other intellectual
 // property including but not limited to intellectual property relating
 // to a hardware implementation of the functionality of the software
 // licensed hereunder.  You may use the software subject to the license
 // terms below provided that you ensure that this notice is replicated
 // unmodified and in its entirety in all distributions of the software,
 // modified or unmodified, in source code or in binary form.
 //
 // Redistribution and use in source and binary forms, with or without
 // modification, are permitted provided that the following conditions are
 // met: redistributions of source code must retain the above copyright
 // notice, this list of conditions and the following disclaimer;
 // redistributions in binary form must reproduce the above copyright
 // notice, this list of conditions and the following disclaimer in the
 // documentation and/or other materials provided with the distribution;
 // neither the name of the copyright holders nor the names of its
 // contributors may be used to endorse or promote products derived from
 // this software without specific prior written permission.
 //
 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

 ////////////////////////////////////////////////////////////////////
 //
 //  Code to "specialize" a microcode sequence to use a particular
 //  variety of operands
 //

 let {{
     # This code builds up a decode block which decodes based on switchval.
     # vals is a dict which matches case values with what should be decoded to.
     # Each element of the dict is a list containing a function and then the
     # arguments to pass to it.
     def doSplitDecode(switchVal, vals, default = None):
         blocks = OutputBlocks()
         blocks.decode_block = 'switch(%s) {\n' % switchVal
         for (val, todo) in vals.items():
             new_blocks = todo[0](*todo[1:])
             new_blocks.decode_block = \
                 '\tcase %s: %s\n' % (val, new_blocks.decode_block)
             blocks.append(new_blocks)
         if default:
             new_blocks = default[0](*default[1:])
             new_blocks.decode_block = \
                 '\tdefault: %s\n' % new_blocks.decode_block
             blocks.append(new_blocks)
         blocks.decode_block += '}\n'
         return blocks
 }};

 let {{
     def doRipRelativeDecode(Name, opTypes, env):
         # print "RIPing %s with opTypes %s" % (Name, opTypes)
         env.memoryInst = True
         normEnv = copy.copy(env)
         normEnv.addToDisassembly(
                 '''printMem(out, env.seg, env.scale, env.index, env.base,
                     machInst.displacement, env.addressSize, false);''')
         normBlocks = specializeInst(Name + "_M", copy.copy(opTypes), normEnv)
         ripEnv = copy.copy(env)
         ripEnv.addToDisassembly(
                 '''printMem(out, env.seg, 1, 0, 0,
                     machInst.displacement, env.addressSize, true);''')
         ripBlocks = specializeInst(Name + "_P", copy.copy(opTypes), ripEnv)

         blocks = OutputBlocks()
         blocks.append(normBlocks)
         blocks.append(ripBlocks)

         blocks.decode_block = '''
         if(machInst.modRM.mod == 0 &&
           machInst.modRM.rm == 5 &&
           machInst.mode.submode == SixtyFourBitMode)
         { %s }
         else
         { %s }''' % \
          (ripBlocks.decode_block, normBlocks.decode_block)
         return blocks
 }};

 let {{
     def doBadInstDecode():
         blocks = OutputBlocks()
         blocks.decode_block = '''
         return new Unknown(machInst);
         '''
         return blocks
 }};

 let {{
     class OpType(object):
         parser = re.compile(r"(?P<tag>[A-Z]+)(?P<size>[a-z]*)|(r(?P<reg>[A-Z0-9]+)(?P<rsize>[a-z]*))")
         def __init__(self, opTypeString):
             match = OpType.parser.search(opTypeString)
             if match == None:
                 raise Exception("Problem parsing operand type {}".format(
                     opTypeString))
             self.reg = match.group("reg")
             self.tag = match.group("tag")
             self.size = match.group("size")
             if not self.size:
                 self.size = match.group("rsize")

     ModRMRegIndex = "(MODRM_REG | (REX_R << 3))"
     ModRMRMIndex = "(MODRM_RM | (REX_B << 3))"
     InstRegIndex = "(OPCODE_OP_BOTTOM3 | (REX_B << 3))"

     # This function specializes the given piece of code to use a particular
     # set of argument types described by "opTypes".
     def specializeInst(Name, opTypes, env):
         # print "Specializing %s with opTypes %s" % (Name, opTypes)
         while len(opTypes):
             # Parse the operand type string we're working with
             opType = OpType(opTypes[0])
             opTypes.pop(0)

             if opType.tag not in ("I", "J", "P", "PR", "Q", "V", "VR", "W"):
                 if opType.size:
                     env.setSize(opType.size)

             if opType.reg:
                 #Figure out what to do with fixed register operands
                 #This is the index to use, so we should stick it some place.
                 if opType.reg in ("A", "B", "C", "D"):
                     regString = "INTREG_R%sX" % opType.reg
                 else:
                     regString = "INTREG_R%s" % opType.reg
                 env.addReg(regString)
                 env.addToDisassembly(
                     "printReg(out, InstRegIndex(%s), regSize);\n" %
                                                                      regString)

                 Name += "_R"

             elif opType.tag == "B":
                 # This refers to registers whose index is encoded as part of the opcode
                 env.addToDisassembly(
                         "printReg(out, InstRegIndex(%s), regSize);\n" %
                                                                   InstRegIndex)

                 Name += "_R"

                 env.addReg(InstRegIndex)
             elif opType.tag == "M":
                 # This refers to memory. The macroop constructor sets up modrm
                 # addressing. Non memory modrm settings should cause an error.
                 env.doModRM = True
                 return doSplitDecode("MODRM_MOD",
                         {"3" : (doBadInstDecode,) },
                         (doRipRelativeDecode, Name, opTypes, env))
             elif opType.tag == None or opType.size == None:
                 raise Exception("Problem parsing operand tag: {}".format(
                     opType.tag))
             elif opType.tag == "C":
                 # A control register indexed by the "reg" field
                 env.addReg(ModRMRegIndex)
                 env.addToDisassembly(
                         "ccprintf(out, \"CR%%d\", %s);\n" % ModRMRegIndex)
                 Name += "_C"
             elif opType.tag == "D":
                 # A debug register indexed by the "reg" field
                 env.addReg(ModRMRegIndex)
                 env.addToDisassembly(
                         "ccprintf(out, \"DR%%d\", %s);\n" % ModRMRegIndex)
                 Name += "_D"
             elif opType.tag == "S":
                 # A segment selector register indexed by the "reg" field
                 env.addReg(ModRMRegIndex)
                 env.addToDisassembly(
                         "printSegment(out, %s);\n" % ModRMRegIndex)
                 Name += "_S"
             elif opType.tag in ("G", "P", "T", "V"):
                 # Use the "reg" field of the ModRM byte to select the register
                 env.addReg(ModRMRegIndex)
                 env.addToDisassembly(
                         "printReg(out, InstRegIndex(%s), regSize);\n" %
                                                                  ModRMRegIndex)

                 if opType.tag == "P":

                     Name += "_MMX"
                 elif opType.tag == "V":
                     Name += "_XMM"
                 else:
                     Name += "_R"
             elif opType.tag in ("E", "Q", "W"):
                 # This might refer to memory or to a register. We need to
                 # divide it up farther.
                 regEnv = copy.copy(env)
                 regEnv.addReg(ModRMRMIndex)
                 regEnv.addToDisassembly(
                         "printReg(out, InstRegIndex(%s), regSize);\n" %
                                                                   ModRMRMIndex)

                 # This refers to memory. The macroop constructor should set up

                 # modrm addressing.
                 memEnv = copy.copy(env)
                 memEnv.doModRM = True
                 regSuffix = "_R"
                 if opType.tag == "Q":
                     regSuffix = "_MMX"
                 elif opType.tag == "W":
                     regSuffix = "_XMM"
                 return doSplitDecode("MODRM_MOD",
                     {"3" : (specializeInst, Name + regSuffix,
                             copy.copy(opTypes), regEnv)},
                            (doRipRelativeDecode, Name,
                             copy.copy(opTypes), memEnv))
             elif opType.tag in ("I", "J"):
                 # Immediates
                 env.addToDisassembly(
                         "ccprintf(out, \"%#x\", machInst.immediate);\n")
                 Name += "_I"
             elif opType.tag == "O":
                 # Immediate containing a memory offset
                 Name += "_MI"
             elif opType.tag in ("PR", "R", "VR"):
                 # Non register modrm settings should cause an error
                 env.addReg(ModRMRMIndex)
                 env.addToDisassembly(
                         "printReg(out, InstRegIndex(%s), regSize);\n" %
                                                                   ModRMRMIndex)

                 if opType.tag == "PR":

                     Name += "_MMX"
                 elif opType.tag == "VR":
                     Name += "_XMM"
                 else:
                     Name += "_R"
             elif opType.tag in ("X", "Y"):
                 # This type of memory addressing is for string instructions.
                 # They'll use the right index and segment internally.
                 if opType.tag == "X":
                     env.addToDisassembly(
                             '''printMem(out, env.seg,
                                 1, X86ISA::ZeroReg, X86ISA::INTREG_RSI, 0,
                                 env.addressSize, false);''')
                 else:
                     env.addToDisassembly(
                             '''printMem(out, SEGMENT_REG_ES,
                                 1, X86ISA::ZeroReg, X86ISA::INTREG_RDI, 0,
                                 env.addressSize, false);''')
                 Name += "_M"
             else:
                 raise Exception("Unrecognized tag {}.".format(opType.tag))

         # Generate code to return a macroop of the given name which will
         # operate in the "emulation environment" env
         return genMacroop(Name, env)
 }};
	// -- mode:c++ --

	// Copyright (c) 2007 The Hewlett-Packard Development Company
	// All rights reserved.
	//
	// The license below extends only to copyright in the software and shall
	// not be construed as granting a license to any other intellectual
	// property including but not limited to intellectual property relating
	// to a hardware implementation of the functionality of the software
	// licensed hereunder. You may use the software subject to the license
	// terms below provided that you ensure that this notice is replicated
	// unmodified and in its entirety in all distributions of the software,
	// modified or unmodified, in source code or in binary form.
	//
	// Redistribution and use in source and binary forms, with or without
	// modification, are permitted provided that the following conditions are
	// met: redistributions of source code must retain the above copyright
	// notice, this list of conditions and the following disclaimer;
	// redistributions in binary form must reproduce the above copyright
	// notice, this list of conditions and the following disclaimer in the
	// documentation and/or other materials provided with the distribution;
	// neither the name of the copyright holders nor the names of its
	// contributors may be used to endorse or promote products derived from
	// this software without specific prior written permission.
	//
	// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
	// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
	// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
	// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
	// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
	// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
	// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
	// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
	// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
	// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
	// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

	////////////////////////////////////////////////////////////////////
	//
	// Code to "specialize" a microcode sequence to use a particular
	// variety of operands
	//

	let {{
	# This code builds up a decode block which decodes based on switchval.
	# vals is a dict which matches case values with what should be decoded to.
	# Each element of the dict is a list containing a function and then the
	# arguments to pass to it.
	def doSplitDecode(switchVal, vals, default = None):
	blocks = OutputBlocks()
	blocks.decode_block = 'switch(%s) {\n' % switchVal
	for (val, todo) in vals.items():
	new_blocks = todo[0](*todo[1:])
	new_blocks.decode_block = \
	'\tcase %s: %s\n' % (val, new_blocks.decode_block)
	blocks.append(new_blocks)
	if default:
	new_blocks = default[0](*default[1:])
	new_blocks.decode_block = \
	'\tdefault: %s\n' % new_blocks.decode_block
	blocks.append(new_blocks)
	blocks.decode_block += '}\n'
	return blocks
	}};

	let {{
	def doRipRelativeDecode(Name, opTypes, env):
	# print "RIPing %s with opTypes %s" % (Name, opTypes)
	env.memoryInst = True
	normEnv = copy.copy(env)
	normEnv.addToDisassembly(
	'''printMem(out, env.seg, env.scale, env.index, env.base,
	machInst.displacement, env.addressSize, false);''')
	normBlocks = specializeInst(Name + "_M", copy.copy(opTypes), normEnv)
	ripEnv = copy.copy(env)
	ripEnv.addToDisassembly(
	'''printMem(out, env.seg, 1, 0, 0,
	machInst.displacement, env.addressSize, true);''')
	ripBlocks = specializeInst(Name + "_P", copy.copy(opTypes), ripEnv)

	blocks = OutputBlocks()
	blocks.append(normBlocks)
	blocks.append(ripBlocks)

	blocks.decode_block = '''
	if(machInst.modRM.mod == 0 &&
	machInst.modRM.rm == 5 &&
	machInst.mode.submode == SixtyFourBitMode)
	{ %s }
	else
	{ %s }''' % \
	(ripBlocks.decode_block, normBlocks.decode_block)
	return blocks
	}};

	let {{
	def doBadInstDecode():
	blocks = OutputBlocks()
	blocks.decode_block = '''
	return new Unknown(machInst);
	'''
	return blocks
	}};

	let {{
	class OpType(object):
	parser = re.compile(r"(?P<tag>[A-Z]+)(?P<size>[a-z])\|(r(?P<reg>[A-Z0-9]+)(?P<rsize>[a-z]))")
	def __init__(self, opTypeString):
	match = OpType.parser.search(opTypeString)
	if match == None:
	raise Exception("Problem parsing operand type {}".format(
	opTypeString))
	self.reg = match.group("reg")
	self.tag = match.group("tag")
	self.size = match.group("size")
	if not self.size:
	self.size = match.group("rsize")

	ModRMRegIndex = "(MODRM_REG \| (REX_R << 3))"
	ModRMRMIndex = "(MODRM_RM \| (REX_B << 3))"
	InstRegIndex = "(OPCODE_OP_BOTTOM3 \| (REX_B << 3))"

	# This function specializes the given piece of code to use a particular
	# set of argument types described by "opTypes".
	def specializeInst(Name, opTypes, env):
	# print "Specializing %s with opTypes %s" % (Name, opTypes)
	while len(opTypes):
	# Parse the operand type string we're working with
	opType = OpType(opTypes[0])
	opTypes.pop(0)

	if opType.tag not in ("I", "J", "P", "PR", "Q", "V", "VR", "W"):
	if opType.size:
	env.setSize(opType.size)

	if opType.reg:
	#Figure out what to do with fixed register operands
	#This is the index to use, so we should stick it some place.
	if opType.reg in ("A", "B", "C", "D"):
	regString = "INTREG_R%sX" % opType.reg
	else:
	regString = "INTREG_R%s" % opType.reg
	env.addReg(regString)
	env.addToDisassembly(
	"printReg(out, InstRegIndex(%s), regSize);\n" %
	regString)

	Name += "_R"

	elif opType.tag == "B":
	# This refers to registers whose index is encoded as part of the opcode
	env.addToDisassembly(
	"printReg(out, InstRegIndex(%s), regSize);\n" %
	InstRegIndex)

	Name += "_R"

	env.addReg(InstRegIndex)
	elif opType.tag == "M":
	# This refers to memory. The macroop constructor sets up modrm
	# addressing. Non memory modrm settings should cause an error.
	env.doModRM = True
	return doSplitDecode("MODRM_MOD",
	{"3" : (doBadInstDecode,) },
	(doRipRelativeDecode, Name, opTypes, env))
	elif opType.tag == None or opType.size == None:
	raise Exception("Problem parsing operand tag: {}".format(
	opType.tag))
	elif opType.tag == "C":
	# A control register indexed by the "reg" field
	env.addReg(ModRMRegIndex)
	env.addToDisassembly(
	"ccprintf(out, \"CR%%d\", %s);\n" % ModRMRegIndex)
	Name += "_C"
	elif opType.tag == "D":
	# A debug register indexed by the "reg" field
	env.addReg(ModRMRegIndex)
	env.addToDisassembly(
	"ccprintf(out, \"DR%%d\", %s);\n" % ModRMRegIndex)
	Name += "_D"
	elif opType.tag == "S":
	# A segment selector register indexed by the "reg" field
	env.addReg(ModRMRegIndex)
	env.addToDisassembly(
	"printSegment(out, %s);\n" % ModRMRegIndex)
	Name += "_S"
	elif opType.tag in ("G", "P", "T", "V"):
	# Use the "reg" field of the ModRM byte to select the register
	env.addReg(ModRMRegIndex)
	env.addToDisassembly(
	"printReg(out, InstRegIndex(%s), regSize);\n" %
	ModRMRegIndex)

	if opType.tag == "P":

	Name += "_MMX"
	elif opType.tag == "V":
	Name += "_XMM"
	else:
	Name += "_R"
	elif opType.tag in ("E", "Q", "W"):
	# This might refer to memory or to a register. We need to
	# divide it up farther.
	regEnv = copy.copy(env)
	regEnv.addReg(ModRMRMIndex)
	regEnv.addToDisassembly(
	"printReg(out, InstRegIndex(%s), regSize);\n" %
	ModRMRMIndex)

	# This refers to memory. The macroop constructor should set up

	# modrm addressing.
	memEnv = copy.copy(env)
	memEnv.doModRM = True
	regSuffix = "_R"
	if opType.tag == "Q":
	regSuffix = "_MMX"
	elif opType.tag == "W":
	regSuffix = "_XMM"
	return doSplitDecode("MODRM_MOD",
	{"3" : (specializeInst, Name + regSuffix,
	copy.copy(opTypes), regEnv)},
	(doRipRelativeDecode, Name,
	copy.copy(opTypes), memEnv))
	elif opType.tag in ("I", "J"):
	# Immediates
	env.addToDisassembly(
	"ccprintf(out, \"%#x\", machInst.immediate);\n")
	Name += "_I"
	elif opType.tag == "O":
	# Immediate containing a memory offset
	Name += "_MI"
	elif opType.tag in ("PR", "R", "VR"):
	# Non register modrm settings should cause an error
	env.addReg(ModRMRMIndex)
	env.addToDisassembly(
	"printReg(out, InstRegIndex(%s), regSize);\n" %
	ModRMRMIndex)

	if opType.tag == "PR":

	Name += "_MMX"
	elif opType.tag == "VR":
	Name += "_XMM"
	else:
	Name += "_R"
	elif opType.tag in ("X", "Y"):
	# This type of memory addressing is for string instructions.
	# They'll use the right index and segment internally.
	if opType.tag == "X":
	env.addToDisassembly(
	'''printMem(out, env.seg,
	1, X86ISA::ZeroReg, X86ISA::INTREG_RSI, 0,
	env.addressSize, false);''')
	else:
	env.addToDisassembly(
	'''printMem(out, SEGMENT_REG_ES,
	1, X86ISA::ZeroReg, X86ISA::INTREG_RDI, 0,
	env.addressSize, false);''')
	Name += "_M"
	else:
	raise Exception("Unrecognized tag {}.".format(opType.tag))

	# Generate code to return a macroop of the given name which will
	# operate in the "emulation environment" env
	return genMacroop(Name, env)
	}};