| # Simulator main loop for m32rx. -*- C -*- | 
 | # | 
 | # Copyright 1996-2021 Free Software Foundation, Inc. | 
 | # | 
 | # This file is part of the GNU Simulators. | 
 | # | 
 | # This program is free software; you can redistribute it and/or modify | 
 | # it under the terms of the GNU General Public License as published by | 
 | # the Free Software Foundation; either version 3 of the License, or | 
 | # (at your option) any later version. | 
 | # | 
 | # This program is distributed in the hope that it will be useful, | 
 | # but WITHOUT ANY WARRANTY; without even the implied warranty of | 
 | # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the | 
 | # GNU General Public License for more details. | 
 | # | 
 | # You should have received a copy of the GNU General Public License | 
 | # along with this program.  If not, see <http://www.gnu.org/licenses/>. | 
 |  | 
 | # Syntax: | 
 | # /bin/sh mainloop.in command | 
 | # | 
 | # Command is one of: | 
 | # | 
 | # init | 
 | # support | 
 | # extract-{simple,scache,pbb} | 
 | # {full,fast}-exec-{simple,scache,pbb} | 
 | # | 
 | # A target need only provide a "full" version of one of simple,scache,pbb. | 
 | # If the target wants it can also provide a fast version of same, or if | 
 | # the slow (full featured) version is `simple', then the fast version can be | 
 | # one of scache/pbb. | 
 | # A target can't provide more than this. | 
 |  | 
 | # ??? After a few more ports are done, revisit. | 
 | # Will eventually need to machine generate a lot of this. | 
 |  | 
 | case "x$1" in | 
 |  | 
 | xsupport) | 
 |  | 
 | cat <<EOF | 
 |  | 
 | /* Emit insns to write back the results of insns executed in parallel. | 
 |    SC points to a sufficient number of scache entries for the writeback | 
 |    handlers. | 
 |    SC1/ID1 is the first insn (left slot, lower address). | 
 |    SC2/ID2 is the second insn (right slot, higher address).  */ | 
 |  | 
 | static INLINE void | 
 | emit_par_finish (SIM_CPU *current_cpu, PCADDR pc, SCACHE *sc, | 
 | 		 SCACHE *sc1, const IDESC *id1, SCACHE *sc2, const IDESC *id2) | 
 | { | 
 |   ARGBUF *abuf; | 
 |  | 
 |   abuf = &sc->argbuf; | 
 |   id1 = id1->par_idesc; | 
 |   abuf->fields.write.abuf = &sc1->argbuf; | 
 |   @cpu@_fill_argbuf (current_cpu, abuf, id1, pc, 0); | 
 |   /* no need to set trace_p,profile_p */ | 
 | #if 0 /* not currently needed for id2 since results written directly */ | 
 |   abuf = &sc[1].argbuf; | 
 |   id2 = id2->par_idesc; | 
 |   abuf->fields.write.abuf = &sc2->argbuf; | 
 |   @cpu@_fill_argbuf (current_cpu, abuf, id2, pc + 2, 0); | 
 |   /* no need to set trace_p,profile_p */ | 
 | #endif | 
 | } | 
 |  | 
 | static INLINE const IDESC * | 
 | emit_16 (SIM_CPU *current_cpu, PCADDR pc, CGEN_INSN_INT insn, | 
 | 	 SCACHE *sc, int fast_p, int parallel_p) | 
 | { | 
 |   ARGBUF *abuf = &sc->argbuf; | 
 |   const IDESC *id = @cpu@_decode (current_cpu, pc, insn, insn, abuf); | 
 |  | 
 |   if (parallel_p) | 
 |     id = id->par_idesc; | 
 |   @cpu@_fill_argbuf (current_cpu, abuf, id, pc, fast_p); | 
 |   return id; | 
 | } | 
 |  | 
 | static INLINE const IDESC * | 
 | emit_full16 (SIM_CPU *current_cpu, PCADDR pc, CGEN_INSN_INT insn, SCACHE *sc, | 
 | 	     int trace_p, int profile_p) | 
 | { | 
 |   const IDESC *id; | 
 |  | 
 |   @cpu@_emit_before (current_cpu, sc, pc, 1); | 
 |   id = emit_16 (current_cpu, pc, insn, sc + 1, 0, 0); | 
 |   @cpu@_emit_after (current_cpu, sc + 2, pc); | 
 |   sc[1].argbuf.trace_p = trace_p; | 
 |   sc[1].argbuf.profile_p = profile_p; | 
 |   return id; | 
 | } | 
 |  | 
 | static INLINE const IDESC * | 
 | emit_parallel (SIM_CPU *current_cpu, PCADDR pc, CGEN_INSN_INT insn, | 
 | 	       SCACHE *sc, int fast_p) | 
 | { | 
 |   const IDESC *id,*id2; | 
 |  | 
 |   /* Emit both insns, then emit a finisher-upper. | 
 |      We speed things up by handling the second insn serially | 
 |      [not parallelly].  Then the writeback only has to deal | 
 |      with the first insn.  */ | 
 |   /* ??? Revisit to handle exceptions right.  */ | 
 |  | 
 |   /* FIXME: No need to handle this parallely if second is nop.  */ | 
 |   id = emit_16 (current_cpu, pc, insn >> 16, sc, fast_p, 1); | 
 |  | 
 |   /* Note that this can never be a cti.  No cti's go in the S pipeline.  */ | 
 |   id2 = emit_16 (current_cpu, pc + 2, insn & 0x7fff, sc + 1, fast_p, 0); | 
 |  | 
 |   /* Set sc/snc insns notion of where to skip to.  */ | 
 |   if (IDESC_SKIP_P (id)) | 
 |     SEM_SKIP_COMPILE (current_cpu, sc, 1); | 
 |  | 
 |   /* Emit code to finish executing the semantics | 
 |      (write back the results).  */ | 
 |   emit_par_finish (current_cpu, pc, sc + 2, sc, id, sc + 1, id2); | 
 |  | 
 |   return id; | 
 | } | 
 |  | 
 | static INLINE const IDESC * | 
 | emit_full_parallel (SIM_CPU *current_cpu, PCADDR pc, CGEN_INSN_INT insn, | 
 | 		    SCACHE *sc, int trace_p, int profile_p) | 
 | { | 
 |   const IDESC *id,*id2; | 
 |  | 
 |   /* Emit both insns, then emit a finisher-upper. | 
 |      We speed things up by handling the second insn serially | 
 |      [not parallelly].  Then the writeback only has to deal | 
 |      with the first insn.  */ | 
 |   /* ??? Revisit to handle exceptions right.  */ | 
 |  | 
 |   @cpu@_emit_before (current_cpu, sc, pc, 1); | 
 |  | 
 |   /* FIXME: No need to handle this parallelly if second is nop.  */ | 
 |   id = emit_16 (current_cpu, pc, insn >> 16, sc + 1, 0, 1); | 
 |   sc[1].argbuf.trace_p = trace_p; | 
 |   sc[1].argbuf.profile_p = profile_p; | 
 |  | 
 |   @cpu@_emit_before (current_cpu, sc + 2, pc, 0); | 
 |  | 
 |   /* Note that this can never be a cti.  No cti's go in the S pipeline.  */ | 
 |   id2 = emit_16 (current_cpu, pc + 2, insn & 0x7fff, sc + 3, 0, 0); | 
 |   sc[3].argbuf.trace_p = trace_p; | 
 |   sc[3].argbuf.profile_p = profile_p; | 
 |  | 
 |   /* Set sc/snc insns notion of where to skip to.  */ | 
 |   if (IDESC_SKIP_P (id)) | 
 |     SEM_SKIP_COMPILE (current_cpu, sc, 4); | 
 |  | 
 |   /* Emit code to finish executing the semantics | 
 |      (write back the results).  */ | 
 |   emit_par_finish (current_cpu, pc, sc + 4, sc + 1, id, sc + 3, id2); | 
 |  | 
 |   @cpu@_emit_after (current_cpu, sc + 5, pc); | 
 |  | 
 |   return id; | 
 | } | 
 |  | 
 | static INLINE const IDESC * | 
 | emit_32 (SIM_CPU *current_cpu, PCADDR pc, CGEN_INSN_INT insn, | 
 | 	 SCACHE *sc, int fast_p) | 
 | { | 
 |   ARGBUF *abuf = &sc->argbuf; | 
 |   const IDESC *id = @cpu@_decode (current_cpu, pc, | 
 | 				  (USI) insn >> 16, insn, abuf); | 
 |  | 
 |   @cpu@_fill_argbuf (current_cpu, abuf, id, pc, fast_p); | 
 |   return id; | 
 | } | 
 |  | 
 | static INLINE const IDESC * | 
 | emit_full32 (SIM_CPU *current_cpu, PCADDR pc, CGEN_INSN_INT insn, SCACHE *sc, | 
 | 	     int trace_p, int profile_p) | 
 | { | 
 |   const IDESC *id; | 
 |  | 
 |   @cpu@_emit_before (current_cpu, sc, pc, 1); | 
 |   id = emit_32 (current_cpu, pc, insn, sc + 1, 0); | 
 |   @cpu@_emit_after (current_cpu, sc + 2, pc); | 
 |   sc[1].argbuf.trace_p = trace_p; | 
 |   sc[1].argbuf.profile_p = profile_p; | 
 |   return id; | 
 | } | 
 |  | 
 | EOF | 
 |  | 
 | ;; | 
 |  | 
 | xinit) | 
 |  | 
 | # Nothing needed. | 
 |  | 
 | ;; | 
 |  | 
 | xextract-pbb) | 
 |  | 
 | # Inputs:  current_cpu, pc, sc, max_insns, FAST_P | 
 | # Outputs: sc, pc | 
 | # sc must be left pointing past the last created entry. | 
 | # pc must be left pointing past the last created entry. | 
 | # If the pbb is terminated by a cti insn, SET_CTI_VPC(sc) must be called | 
 | # to record the vpc of the cti insn. | 
 | # SET_INSN_COUNT(n) must be called to record number of real insns. | 
 |  | 
 | cat <<EOF | 
 | { | 
 |   const IDESC *idesc; | 
 |   int icount = 0; | 
 |  | 
 |   if ((pc & 3) != 0) | 
 |     { | 
 |       /* This occurs when single stepping and when compiling the not-taken | 
 | 	 part of conditional branches.  */ | 
 |       UHI insn = GETIMEMUHI (current_cpu, pc); | 
 |       int trace_p = PC_IN_TRACE_RANGE_P (current_cpu, pc); | 
 |       int profile_p = PC_IN_PROFILE_RANGE_P (current_cpu, pc); | 
 |       SCACHE *cti_sc; /* ??? tmp hack */ | 
 |  | 
 |       /* A parallel insn isn't allowed here, but we don't mind nops. | 
 | 	 ??? We need to wait until the insn is executed before signalling | 
 | 	 the error, for situations where such signalling is wanted.  */ | 
 | #if 0 | 
 |       if ((insn & 0x8000) != 0 | 
 | 	  && (insn & 0x7fff) != 0x7000) /* parallel nops are ok */ | 
 | 	sim_engine_invalid_insn (current_cpu, pc, 0); | 
 | #endif | 
 |  | 
 |       /* Only emit before/after handlers if necessary.  */ | 
 |       if (FAST_P || (! trace_p && ! profile_p)) | 
 | 	{ | 
 | 	  idesc = emit_16 (current_cpu, pc, insn & 0x7fff, sc, FAST_P, 0); | 
 | 	  cti_sc = sc; | 
 | 	  ++sc; | 
 | 	  --max_insns; | 
 | 	} | 
 |       else | 
 | 	{ | 
 | 	  idesc = emit_full16 (current_cpu, pc, insn & 0x7fff, sc, | 
 | 			       trace_p, profile_p); | 
 | 	  cti_sc = sc + 1; | 
 | 	  sc += 3; | 
 | 	  max_insns -= 3; | 
 | 	} | 
 |       ++icount; | 
 |       pc += 2; | 
 |       if (IDESC_CTI_P (idesc)) | 
 | 	{ | 
 | 	  SET_CTI_VPC (cti_sc); | 
 | 	  goto Finish; | 
 | 	} | 
 |     } | 
 |  | 
 |   /* There are two copies of the compiler: full(!fast) and fast. | 
 |      The "full" case emits before/after handlers for each insn. | 
 |      Having two copies of this code is a tradeoff, having one copy | 
 |      seemed a bit more difficult to read (due to constantly testing | 
 |      FAST_P).  ??? On the other hand, with address ranges we'll want to | 
 |      omit before/after handlers for unwanted insns.  Having separate loops | 
 |      for FAST/!FAST avoids constantly doing the test in the loop, but | 
 |      typically FAST_P is a constant and such tests will get optimized out.  */ | 
 |  | 
 |   if (FAST_P) | 
 |     { | 
 |       while (max_insns > 0) | 
 | 	{ | 
 | 	  USI insn = GETIMEMUSI (current_cpu, pc); | 
 | 	  if ((SI) insn < 0) | 
 | 	    { | 
 | 	      /* 32 bit insn */ | 
 | 	      idesc = emit_32 (current_cpu, pc, insn, sc, 1); | 
 | 	      ++sc; | 
 | 	      --max_insns; | 
 | 	      ++icount; | 
 | 	      pc += 4; | 
 | 	      if (IDESC_CTI_P (idesc)) | 
 | 		{ | 
 | 		  SET_CTI_VPC (sc - 1); | 
 | 		  break; | 
 | 		} | 
 | 	    } | 
 | 	  else | 
 | 	    { | 
 | 	      if ((insn & 0x8000) != 0) /* parallel? */ | 
 | 		{ | 
 | 		  int up_count; | 
 |  | 
 | 		  if (((insn >> 16) & 0xfff0) == 0x10f0) | 
 | 		    { | 
 | 		      /* FIXME: No need to handle this sequentially if system | 
 | 		         calls will be able to execute after second insn in | 
 | 		         parallel. ( trap #num || insn ) */ | 
 | 		      /* insn */ | 
 | 		      idesc = emit_16 (current_cpu, pc + 2, insn & 0x7fff, | 
 |  				       sc, 1, 0); | 
 | 		      /* trap */ | 
 | 		      emit_16 (current_cpu, pc, insn >> 16, sc + 1, 1, 0); | 
 | 		      up_count = 2; | 
 | 		    } | 
 | 		  else | 
 | 		    { | 
 | 		      /* Yep.  Here's the "interesting" [sic] part.  */ | 
 | 		      idesc = emit_parallel (current_cpu, pc, insn, sc, 1); | 
 | 		      up_count = 3; | 
 | 		    } | 
 | 		  sc += up_count; | 
 | 		  max_insns -= up_count; | 
 | 		  icount += 2; | 
 | 		  pc += 4; | 
 | 		  if (IDESC_CTI_P (idesc)) | 
 | 		    { | 
 | 		      SET_CTI_VPC (sc - up_count); | 
 | 		      break; | 
 | 		    } | 
 | 		} | 
 | 	      else /* 2 serial 16 bit insns */ | 
 | 		{ | 
 | 		  idesc = emit_16 (current_cpu, pc, insn >> 16, sc, 1, 0); | 
 | 		  ++sc; | 
 | 		  --max_insns; | 
 | 		  ++icount; | 
 | 		  pc += 2; | 
 | 		  if (IDESC_CTI_P (idesc)) | 
 | 		    { | 
 | 		      SET_CTI_VPC (sc - 1); | 
 | 		      break; | 
 | 		    } | 
 | 		  /* While we're guaranteed that there's room to extract the | 
 | 		     insn, when single stepping we can't; the pbb must stop | 
 | 		     after the first insn.  */ | 
 | 		  if (max_insns == 0) | 
 | 		    break; | 
 | 		  idesc = emit_16 (current_cpu, pc, insn & 0x7fff, sc, 1, 0); | 
 | 		  ++sc; | 
 | 		  --max_insns; | 
 | 		  ++icount; | 
 | 		  pc += 2; | 
 | 		  if (IDESC_CTI_P (idesc)) | 
 | 		    { | 
 | 		      SET_CTI_VPC (sc - 1); | 
 | 		      break; | 
 | 		    } | 
 | 		} | 
 | 	    } | 
 | 	} | 
 |     } | 
 |   else /* ! FAST_P */ | 
 |     { | 
 |       while (max_insns > 0) | 
 | 	{ | 
 | 	  USI insn = GETIMEMUSI (current_cpu, pc); | 
 | 	  int trace_p = PC_IN_TRACE_RANGE_P (current_cpu, pc); | 
 | 	  int profile_p = PC_IN_PROFILE_RANGE_P (current_cpu, pc); | 
 | 	  SCACHE *cti_sc; /* ??? tmp hack */ | 
 | 	  if ((SI) insn < 0) | 
 | 	    { | 
 | 	      /* 32 bit insn | 
 | 		 Only emit before/after handlers if necessary.  */ | 
 | 	      if (trace_p || profile_p) | 
 | 		{ | 
 | 		  idesc = emit_full32 (current_cpu, pc, insn, sc, | 
 | 				       trace_p, profile_p); | 
 | 		  cti_sc = sc + 1; | 
 | 		  sc += 3; | 
 | 		  max_insns -= 3; | 
 | 		} | 
 | 	      else | 
 | 		{ | 
 | 		  idesc = emit_32 (current_cpu, pc, insn, sc, 0); | 
 | 		  cti_sc = sc; | 
 | 		  ++sc; | 
 | 		  --max_insns; | 
 | 		} | 
 | 	      ++icount; | 
 | 	      pc += 4; | 
 | 	      if (IDESC_CTI_P (idesc)) | 
 | 		{ | 
 | 		  SET_CTI_VPC (cti_sc); | 
 | 		  break; | 
 | 		} | 
 | 	    } | 
 | 	  else | 
 | 	    { | 
 | 	      if ((insn & 0x8000) != 0) /* parallel? */ | 
 | 		{ | 
 | 		  /* Yep.  Here's the "interesting" [sic] part. | 
 | 		     Only emit before/after handlers if necessary.  */ | 
 | 		  if (trace_p || profile_p) | 
 | 		    { | 
 | 		      if (((insn >> 16) & 0xfff0) == 0x10f0) | 
 | 			{ | 
 | 			  /* FIXME: No need to handle this sequentially if | 
 | 			     system calls will be able to execute after second | 
 | 			     insn in parallel. ( trap #num || insn ) */ | 
 | 			  /* insn */ | 
 | 			  idesc = emit_full16 (current_cpu, pc + 2, | 
 | 					       insn & 0x7fff, sc, 0, 0); | 
 | 			  /* trap */ | 
 | 			  emit_full16 (current_cpu, pc, insn >> 16, sc + 3, | 
 | 				       0, 0); | 
 | 			} | 
 | 		      else | 
 | 			{ | 
 | 		          idesc = emit_full_parallel (current_cpu, pc, insn, | 
 | 						      sc, trace_p, profile_p); | 
 | 			} | 
 | 		      cti_sc = sc + 1; | 
 | 		      sc += 6; | 
 | 		      max_insns -= 6; | 
 | 		    } | 
 | 		  else | 
 | 		    { | 
 | 		      int up_count; | 
 |  | 
 | 		      if (((insn >> 16) & 0xfff0) == 0x10f0) | 
 | 			{ | 
 |                           /* FIXME: No need to handle this sequentially if | 
 |                              system calls will be able to execute after second | 
 |                              insn in parallel. ( trap #num || insn ) */ | 
 |                           /* insn */ | 
 |                           idesc = emit_16 (current_cpu, pc + 2, insn & 0x7fff, | 
 |                                            sc, 0, 0); | 
 |                           /* trap */ | 
 |                           emit_16 (current_cpu, pc, insn >> 16, sc + 1, 0, 0); | 
 |                           up_count = 2; | 
 | 			} | 
 | 		      else | 
 | 			{ | 
 | 		          idesc = emit_parallel (current_cpu, pc, insn, sc, 0); | 
 |                           up_count = 3; | 
 | 			} | 
 | 		      cti_sc = sc; | 
 | 		      sc += up_count; | 
 | 		      max_insns -= up_count; | 
 | 		    } | 
 | 		  icount += 2; | 
 | 		  pc += 4; | 
 | 		  if (IDESC_CTI_P (idesc)) | 
 | 		    { | 
 | 		      SET_CTI_VPC (cti_sc); | 
 | 		      break; | 
 | 		    } | 
 | 		} | 
 | 	      else /* 2 serial 16 bit insns */ | 
 | 		{ | 
 | 		  /* Only emit before/after handlers if necessary.  */ | 
 | 		  if (trace_p || profile_p) | 
 | 		    { | 
 | 		      idesc = emit_full16 (current_cpu, pc, insn >> 16, sc, | 
 | 					   trace_p, profile_p); | 
 | 		      cti_sc = sc + 1; | 
 | 		      sc += 3; | 
 | 		      max_insns -= 3; | 
 | 		    } | 
 | 		  else | 
 | 		    { | 
 | 		      idesc = emit_16 (current_cpu, pc, insn >> 16, sc, 0, 0); | 
 | 		      cti_sc = sc; | 
 | 		      ++sc; | 
 | 		      --max_insns; | 
 | 		    } | 
 | 		  ++icount; | 
 | 		  pc += 2; | 
 | 		  if (IDESC_CTI_P (idesc)) | 
 | 		    { | 
 | 		      SET_CTI_VPC (cti_sc); | 
 | 		      break; | 
 | 		    } | 
 | 		  /* While we're guaranteed that there's room to extract the | 
 | 		     insn, when single stepping we can't; the pbb must stop | 
 | 		     after the first insn.  */ | 
 | 		  if (max_insns <= 0) | 
 | 		    break; | 
 | 		  /* Use the same trace/profile address for the 2nd insn. | 
 | 		     Saves us having to compute it and they come in pairs | 
 | 		     anyway (e.g. can never branch to the 2nd insn).  */ | 
 | 		  if (trace_p || profile_p) | 
 | 		    { | 
 | 		      idesc = emit_full16 (current_cpu, pc, insn & 0x7fff, sc, | 
 | 					   trace_p, profile_p); | 
 | 		      cti_sc = sc + 1; | 
 | 		      sc += 3; | 
 | 		      max_insns -= 3; | 
 | 		    } | 
 | 		  else | 
 | 		    { | 
 | 		      idesc = emit_16 (current_cpu, pc, insn & 0x7fff, sc, 0, 0); | 
 | 		      cti_sc = sc; | 
 | 		      ++sc; | 
 | 		      --max_insns; | 
 | 		    } | 
 | 		  ++icount; | 
 | 		  pc += 2; | 
 | 		  if (IDESC_CTI_P (idesc)) | 
 | 		    { | 
 | 		      SET_CTI_VPC (cti_sc); | 
 | 		      break; | 
 | 		    } | 
 | 		} | 
 | 	    } | 
 | 	} | 
 |     } | 
 |  | 
 |  Finish: | 
 |   SET_INSN_COUNT (icount); | 
 | } | 
 | EOF | 
 |  | 
 | ;; | 
 |  | 
 | xfull-exec-pbb) | 
 |  | 
 | # Inputs: current_cpu, vpc, FAST_P | 
 | # Outputs: vpc | 
 | # vpc is the virtual program counter. | 
 |  | 
 | cat <<EOF | 
 | #define DEFINE_SWITCH | 
 | #include "semx-switch.c" | 
 | EOF | 
 |  | 
 | ;; | 
 |  | 
 | *) | 
 |   echo "Invalid argument to mainloop.in: $1" >&2 | 
 |   exit 1 | 
 |   ;; | 
 |  | 
 | esac |