1 %{
2 /* Parser for i386 CPU description.
3    Copyright (C) 2004, 2005, 2007, 2008, 2009 Red Hat, Inc.
4    Written by Ulrich Drepper <drepper@redhat.com>, 2004.
5 
6    This file is free software; you can redistribute it and/or modify
7    it under the terms of either
8 
9      * the GNU Lesser General Public License as published by the Free
10        Software Foundation; either version 3 of the License, or (at
11        your option) any later version
12 
13    or
14 
15      * the GNU General Public License as published by the Free
16        Software Foundation; either version 2 of the License, or (at
17        your option) any later version
18 
19    or both in parallel, as here.
20 
21    elfutils is distributed in the hope that it will be useful, but
22    WITHOUT ANY WARRANTY; without even the implied warranty of
23    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
24    General Public License for more details.
25 
26    You should have received copies of the GNU General Public License and
27    the GNU Lesser General Public License along with this program.  If
28    not, see <http://www.gnu.org/licenses/>.  */
29 
30 #ifdef HAVE_CONFIG_H
31 # include <config.h>
32 #endif
33 
34 #include <assert.h>
35 #include <ctype.h>
36 #include <errno.h>
37 #include <inttypes.h>
38 #include <libintl.h>
39 #include <math.h>
40 #include <obstack.h>
41 #include <search.h>
42 #include <stdbool.h>
43 #include <stdio.h>
44 #include <stdlib.h>
45 #include <string.h>
46 
47 #include <libeu.h>
48 #include <system.h>
49 
50 #define obstack_chunk_alloc xmalloc
51 #define obstack_chunk_free free
52 
53 /* The error handler.  */
54 static void yyerror (const char *s);
55 
56 extern int yylex (void);
57 extern int i386_lineno;
58 extern char *infname;
59 
60 
61 struct known_bitfield
62 {
63   char *name;
64   unsigned long int bits;
65   int tmp;
66 };
67 
68 
69 struct bitvalue
70 {
71   enum bittype { zeroone, field, failure } type;
72   union
73   {
74     unsigned int value;
75     struct known_bitfield *field;
76   };
77   struct bitvalue *next;
78 };
79 
80 
81 struct argname
82 {
83   enum nametype { string, nfield } type;
84   union
85   {
86     char *str;
87     struct known_bitfield *field;
88   };
89   struct argname *next;
90 };
91 
92 
93 struct argument
94 {
95   struct argname *name;
96   struct argument *next;
97 };
98 
99 
100 struct instruction
101 {
102   /* The byte encoding.  */
103   struct bitvalue *bytes;
104 
105   /* Prefix possible.  */
106   int repe;
107   int rep;
108 
109   /* Mnemonic.  */
110   char *mnemonic;
111 
112   /* Suffix.  */
113   enum { suffix_none = 0, suffix_w, suffix_w0, suffix_W, suffix_tttn,
114 	 suffix_w1, suffix_W1, suffix_D } suffix;
115 
116   /* Flag set if modr/m is used.  */
117   int modrm;
118 
119   /* Operands.  */
120   struct operand
121   {
122     char *fct;
123     char *str;
124     int off1;
125     int off2;
126     int off3;
127   } operands[3];
128 
129   struct instruction *next;
130 };
131 
132 
133 struct synonym
134 {
135   char *from;
136   char *to;
137 };
138 
139 
140 struct suffix
141 {
142   char *name;
143   int idx;
144 };
145 
146 
147 struct argstring
148 {
149   char *str;
150   int idx;
151   int off;
152 };
153 
154 
155 static struct known_bitfield ax_reg =
156   {
157     .name = "ax", .bits = 0, .tmp = 0
158   };
159 
160 static struct known_bitfield dx_reg =
161   {
162     .name = "dx", .bits = 0, .tmp = 0
163   };
164 
165 static struct known_bitfield di_reg =
166   {
167     .name = "es_di", .bits = 0, .tmp = 0
168   };
169 
170 static struct known_bitfield si_reg =
171   {
172     .name = "ds_si", .bits = 0, .tmp = 0
173   };
174 
175 static struct known_bitfield bx_reg =
176   {
177     .name = "ds_bx", .bits = 0, .tmp = 0
178   };
179 
180 
181 static int bitfield_compare (const void *p1, const void *p2);
182 static void new_bitfield (char *name, unsigned long int num);
183 static void check_bits (struct bitvalue *value);
184 static int check_duplicates (struct bitvalue *val);
185 static int check_argsdef (struct bitvalue *bitval, struct argument *args);
186 static int check_bitsused (struct bitvalue *bitval,
187 			   struct known_bitfield *suffix,
188 			   struct argument *args);
189 static struct argname *combine (struct argname *name);
190 static void fillin_arg (struct bitvalue *bytes, struct argname *name,
191 			struct instruction *instr, int n);
192 static void find_numbers (void);
193 static int compare_syn (const void *p1, const void *p2);
194 static int compare_suf (const void *p1, const void *p2);
195 static void instrtable_out (void);
196 #if 0
197 static void create_mnemonic_table (void);
198 #endif
199 
200 static void *bitfields;
201 static struct instruction *instructions;
202 static size_t ninstructions;
203 static void *synonyms;
204 static void *suffixes;
205 static int nsuffixes;
206 static void *mnemonics;
207 size_t nmnemonics;
208 extern FILE *outfile;
209 
210 /* Number of bits used mnemonics.  */
211 #if 0
212 static size_t best_mnemonic_bits;
213 #endif
214 %}
215 
216 %union {
217   unsigned long int num;
218   char *str;
219   char ch;
220   struct known_bitfield *field;
221   struct bitvalue *bit;
222   struct argname *name;
223   struct argument *arg;
224 }
225 
226 %token kMASK
227 %token kPREFIX
228 %token kSUFFIX
229 %token kSYNONYM
230 %token <str> kID
231 %token <num> kNUMBER
232 %token kPERCPERC
233 %token <str> kBITFIELD
234 %token <ch> kCHAR
235 %token kSPACE
236 
237 %type <bit> bit byte bytes
238 %type <field> bitfieldopt
239 %type <name> argcomp arg
240 %type <arg> args optargs
241 
242 %defines
243 
244 %%
245 
246 spec:		  masks kPERCPERC '\n' instrs
247 		    {
248 		      if (error_message_count != 0)
249 			error (EXIT_FAILURE, 0,
250 			       "terminated due to previous error");
251 
252 		      instrtable_out ();
253 		    }
254 		;
255 
256 masks:		  masks '\n' mask
257 		| mask
258 		;
259 
260 mask:		  kMASK kBITFIELD kNUMBER
261 		    { new_bitfield ($2, $3); }
262 		| kPREFIX kBITFIELD
263 		    { new_bitfield ($2, -1); }
264 		| kSUFFIX kBITFIELD
265 		    { new_bitfield ($2, -2); }
266 		| kSYNONYM kBITFIELD kBITFIELD
267 		    {
268 		      struct synonym *newp = xmalloc (sizeof (*newp));
269 		      newp->from = $2;
270 		      newp->to = $3;
271 		      if (tfind (newp, &synonyms, compare_syn) != NULL)
272 			error (0, 0,
273 			       "%d: duplicate definition for synonym '%s'",
274 			       i386_lineno, $2);
275 		      else if (tsearch ( newp, &synonyms, compare_syn) == NULL)
276 			error (EXIT_FAILURE, 0, "tsearch");
277 		    }
278 		|
279 		;
280 
281 instrs:		  instrs '\n' instr
282 		| instr
283 		;
284 
285 instr:		  bytes ':' bitfieldopt kID bitfieldopt optargs
286 		    {
287 		      if ($3 != NULL && strcmp ($3->name, "RE") != 0
288 			  && strcmp ($3->name, "R") != 0)
289 			{
290 			  error (0, 0, "%d: only 'R' and 'RE' prefix allowed",
291 				 i386_lineno - 1);
292 			}
293 		      if (check_duplicates ($1) == 0
294 			  && check_argsdef ($1, $6) == 0
295 			  && check_bitsused ($1, $5, $6) == 0)
296 			{
297 			  struct instruction *newp = xcalloc (sizeof (*newp),
298 							      1);
299 			  if ($3 != NULL)
300 			    {
301 			      if (strcmp ($3->name, "RE") == 0)
302 				newp->repe = 1;
303 			      else if (strcmp ($3->name, "R") == 0)
304 				newp->rep = 1;
305 			    }
306 
307 			  newp->bytes = $1;
308 			  newp->mnemonic = $4;
309 			  if (newp->mnemonic != (void *) -1l
310 			      && tfind ($4, &mnemonics,
311 					(int (*)(const void *, const void *)) strcmp) == NULL)
312 			    {
313 			      if (tsearch ($4, &mnemonics,
314 					   (int (*)(const void *, const void *)) strcmp) == NULL)
315 				error (EXIT_FAILURE, errno, "tsearch");
316 			      ++nmnemonics;
317 			    }
318 
319 			  if ($5 != NULL)
320 			    {
321 			      if (strcmp ($5->name, "w") == 0)
322 				newp->suffix = suffix_w;
323 			      else if (strcmp ($5->name, "w0") == 0)
324 				newp->suffix = suffix_w0;
325 			      else if (strcmp ($5->name, "tttn") == 0)
326 				newp->suffix = suffix_tttn;
327 			      else if (strcmp ($5->name, "w1") == 0)
328 				newp->suffix = suffix_w1;
329 			      else if (strcmp ($5->name, "W") == 0)
330 				newp->suffix = suffix_W;
331 			      else if (strcmp ($5->name, "W1") == 0)
332 				newp->suffix = suffix_W1;
333 			      else if (strcmp ($5->name, "D") == 0)
334 				newp->suffix = suffix_D;
335 			      else
336 				error (EXIT_FAILURE, 0,
337 				       "%s: %d: unknown suffix '%s'",
338 				       infname, i386_lineno - 1, $5->name);
339 
340 			      struct suffix search = { .name = $5->name };
341 			      if (tfind (&search, &suffixes, compare_suf)
342 				  == NULL)
343 				{
344 				  struct suffix *ns = xmalloc (sizeof (*ns));
345 				  ns->name = $5->name;
346 				  ns->idx = ++nsuffixes;
347 				  if (tsearch (ns, &suffixes, compare_suf)
348 				      == NULL)
349 				    error (EXIT_FAILURE, errno, "tsearch");
350 				}
351 			    }
352 
353 			  struct argument *args = $6;
354 			  int n = 0;
355 			  while (args != NULL)
356 			    {
357 			      fillin_arg ($1, args->name, newp, n);
358 
359 			      args = args->next;
360 			      ++n;
361 			    }
362 
363 			  newp->next = instructions;
364 			  instructions = newp;
365 			  ++ninstructions;
366 			}
367 		    }
368 		|
369 		;
370 
371 bitfieldopt:	  kBITFIELD
372 		    {
373 		      struct known_bitfield search;
374 		      search.name = $1;
375 		      struct known_bitfield **res;
376 		      res = tfind (&search, &bitfields, bitfield_compare);
377 		      if (res == NULL)
378 			{
379 			  error (0, 0, "%d: unknown bitfield '%s'",
380 				 i386_lineno, search.name);
381 			  $$ = NULL;
382 			}
383 		      else
384 			$$ = *res;
385 		    }
386 		|
387 		    { $$ = NULL; }
388 		;
389 
390 bytes:		  bytes ',' byte
391 		    {
392 		      check_bits ($3);
393 
394 		      struct bitvalue *runp = $1;
395 		      while (runp->next != NULL)
396 			runp = runp->next;
397 		      runp->next = $3;
398 		      $$ = $1;
399 		    }
400 		| byte
401 		    {
402 		      check_bits ($1);
403 		      $$ = $1;
404 		    }
405 		;
406 
407 byte:		  byte bit
408 		    {
409 		      struct bitvalue *runp = $1;
410 		      while (runp->next != NULL)
411 			runp = runp->next;
412 		      runp->next = $2;
413 		      $$ = $1;
414 		    }
415 		| bit
416 		    { $$ = $1; }
417 		;
418 
419 bit:		  '0'
420 		    {
421 		      $$ = xmalloc (sizeof (struct bitvalue));
422 		      $$->type = zeroone;
423 		      $$->value = 0;
424 		      $$->next = NULL;
425 		    }
426 		| '1'
427 		    {
428 		      $$ = xmalloc (sizeof (struct bitvalue));
429 		      $$->type = zeroone;
430 		      $$->value = 1;
431 		      $$->next = NULL;
432 		    }
433 		| kBITFIELD
434 		    {
435 		      $$ = xmalloc (sizeof (struct bitvalue));
436 		      struct known_bitfield search;
437 		      search.name = $1;
438 		      struct known_bitfield **res;
439 		      res = tfind (&search, &bitfields, bitfield_compare);
440 		      if (res == NULL)
441 			{
442 			  error (0, 0, "%d: unknown bitfield '%s'",
443 				 i386_lineno, search.name);
444 			  $$->type = failure;
445 			}
446 		      else
447 			{
448 			  $$->type = field;
449 			  $$->field = *res;
450 			}
451 		      $$->next = NULL;
452 		    }
453 		;
454 
455 optargs:	  kSPACE args
456 		    { $$ = $2; }
457 		|
458 		    { $$ = NULL; }
459 		;
460 
461 args:		  args ',' arg
462 		    {
463 		      struct argument *runp = $1;
464 		      while (runp->next != NULL)
465 			runp = runp->next;
466 		      runp->next = xmalloc (sizeof (struct argument));
467 		      runp->next->name = combine ($3);
468 		      runp->next->next = NULL;
469 		      $$ = $1;
470 		    }
471 		| arg
472 		    {
473 		      $$ = xmalloc (sizeof (struct argument));
474 		      $$->name = combine ($1);
475 		      $$->next = NULL;
476 		    }
477 		;
478 
479 arg:		  arg argcomp
480 		    {
481 		      struct argname *runp = $1;
482 		      while (runp->next != NULL)
483 			runp = runp->next;
484 		      runp->next = $2;
485 		      $$ = $1;
486 		    }
487 		| argcomp
488 		    { $$ = $1; }
489 		;
490 argcomp:	  kBITFIELD
491 		    {
492 		      $$ = xmalloc (sizeof (struct argname));
493 		      $$->type = nfield;
494 		      $$->next = NULL;
495 
496 		      struct known_bitfield search;
497 		      search.name = $1;
498 		      struct known_bitfield **res;
499 		      res = tfind (&search, &bitfields, bitfield_compare);
500 		      if (res == NULL)
501 			{
502 			  if (strcmp ($1, "ax") == 0)
503 			    $$->field = &ax_reg;
504 			  else if (strcmp ($1, "dx") == 0)
505 			    $$->field = &dx_reg;
506 			  else if (strcmp ($1, "es_di") == 0)
507 			    $$->field = &di_reg;
508 			  else if (strcmp ($1, "ds_si") == 0)
509 			    $$->field = &si_reg;
510 			  else if (strcmp ($1, "ds_bx") == 0)
511 			    $$->field = &bx_reg;
512 			  else
513 			    {
514 			      error (0, 0, "%d: unknown bitfield '%s'",
515 				     i386_lineno, search.name);
516 			      $$->field = NULL;
517 			    }
518 			}
519 		      else
520 			$$->field = *res;
521 		    }
522 		| kCHAR
523 		    {
524 		      $$ = xmalloc (sizeof (struct argname));
525 		      $$->type = string;
526 		      $$->next = NULL;
527 		      $$->str = xmalloc (2);
528 		      $$->str[0] = $1;
529 		      $$->str[1] = '\0';
530 		    }
531 		| kID
532 		    {
533 		      $$ = xmalloc (sizeof (struct argname));
534 		      $$->type = string;
535 		      $$->next = NULL;
536 		      $$->str = $1;
537 		    }
538 		| ':'
539 		    {
540 		      $$ = xmalloc (sizeof (struct argname));
541 		      $$->type = string;
542 		      $$->next = NULL;
543 		      $$->str = xmalloc (2);
544 		      $$->str[0] = ':';
545 		      $$->str[1] = '\0';
546 		    }
547 		;
548 
549 %%
550 
551 static void
552 yyerror (const char *s)
553 {
554   error (0, 0, _("while reading i386 CPU description: %s at line %d"),
555          _(s), i386_lineno);
556 }
557 
558 
559 static int
bitfield_compare(const void * p1,const void * p2)560 bitfield_compare (const void *p1, const void *p2)
561 {
562   struct known_bitfield *f1 = (struct known_bitfield *) p1;
563   struct known_bitfield *f2 = (struct known_bitfield *) p2;
564 
565   return strcmp (f1->name, f2->name);
566 }
567 
568 
569 static void
new_bitfield(char * name,unsigned long int num)570 new_bitfield (char *name, unsigned long int num)
571 {
572   struct known_bitfield *newp = xmalloc (sizeof (struct known_bitfield));
573   newp->name = name;
574   newp->bits = num;
575   newp->tmp = 0;
576 
577   if (tfind (newp, &bitfields, bitfield_compare) != NULL)
578     {
579       error (0, 0, "%d: duplicated definition of bitfield '%s'",
580 	     i386_lineno, name);
581       free (name);
582       free (newp);
583       return;
584     }
585 
586   if (tsearch (newp, &bitfields, bitfield_compare) == NULL)
587     error (EXIT_FAILURE, errno, "%d: cannot insert new bitfield '%s'",
588 	   i386_lineno, name);
589 }
590 
591 
592 /* Check that the number of bits is a multiple of 8.  */
593 static void
check_bits(struct bitvalue * val)594 check_bits (struct bitvalue *val)
595 {
596   struct bitvalue *runp = val;
597   unsigned int total = 0;
598 
599   while (runp != NULL)
600     {
601       if (runp->type == zeroone)
602 	++total;
603       else if (runp->field == NULL)
604 	/* No sense doing anything, the field is not known.  */
605 	return;
606       else
607 	total += runp->field->bits;
608 
609       runp = runp->next;
610     }
611 
612   if (total % 8 != 0)
613     {
614       struct obstack os;
615       obstack_init (&os);
616 
617       while (val != NULL)
618 	{
619 	  if (val->type == zeroone)
620 	    obstack_printf (&os, "%u", val->value);
621 	  else
622 	    obstack_printf (&os, "{%s}", val->field->name);
623 	  val = val->next;
624 	}
625       obstack_1grow (&os, '\0');
626 
627       error (0, 0, "%d: field '%s' not a multiple of 8 bits in size",
628 	     i386_lineno, (char *) obstack_finish (&os));
629 
630       obstack_free (&os, NULL);
631     }
632 }
633 
634 
635 static int
check_duplicates(struct bitvalue * val)636 check_duplicates (struct bitvalue *val)
637 {
638   static int testcnt;
639   ++testcnt;
640 
641   int result = 0;
642   while (val != NULL)
643     {
644       if (val->type == field && val->field != NULL)
645 	{
646 	  if (val->field->tmp == testcnt)
647 	    {
648 	      error (0, 0, "%d: bitfield '%s' used more than once",
649 		     i386_lineno - 1, val->field->name);
650 	      result = 1;
651 	    }
652 	  val->field->tmp = testcnt;
653 	}
654 
655       val = val->next;
656     }
657 
658   return result;
659 }
660 
661 
662 static int
check_argsdef(struct bitvalue * bitval,struct argument * args)663 check_argsdef (struct bitvalue *bitval, struct argument *args)
664 {
665   int result = 0;
666 
667   while (args != NULL)
668     {
669       for (struct argname *name = args->name; name != NULL; name = name->next)
670 	if (name->type == nfield && name->field != NULL
671 	    && name->field != &ax_reg && name->field != &dx_reg
672 	    && name->field != &di_reg && name->field != &si_reg
673 	    && name->field != &bx_reg)
674 	  {
675 	    struct bitvalue *runp = bitval;
676 
677 	    while (runp != NULL)
678 	      if (runp->type == field && runp->field == name->field)
679 		break;
680 	      else
681 		runp = runp->next;
682 
683 	    if (runp == NULL)
684 	      {
685 		error (0, 0, "%d: unknown bitfield '%s' used in output format",
686 		       i386_lineno - 1, name->field->name);
687 		result = 1;
688 	      }
689 	  }
690 
691       args = args->next;
692     }
693 
694   return result;
695 }
696 
697 
698 static int
check_bitsused(struct bitvalue * bitval,struct known_bitfield * suffix,struct argument * args)699 check_bitsused (struct bitvalue *bitval, struct known_bitfield *suffix,
700 		struct argument *args)
701 {
702   int result = 0;
703 
704   while (bitval != NULL)
705     {
706       if (bitval->type == field && bitval->field != NULL
707 	  && bitval->field != suffix
708 	  /* {w} is handled special.  */
709 	  && strcmp (bitval->field->name, "w") != 0)
710 	{
711 	  struct argument *runp;
712 	  for (runp = args; runp != NULL; runp = runp->next)
713 	    {
714 	      struct argname *name = runp->name;
715 
716 	      while (name != NULL)
717 		if (name->type == nfield && name->field == bitval->field)
718 		  break;
719 		else
720 		  name = name->next;
721 
722 	      if (name != NULL)
723 		break;
724 	    }
725 
726 #if 0
727 	  if (runp == NULL)
728 	    {
729 	      error (0, 0, "%d: bitfield '%s' not used",
730 		     i386_lineno - 1, bitval->field->name);
731 	      result = 1;
732 	    }
733 #endif
734 	}
735 
736       bitval = bitval->next;
737     }
738 
739   return result;
740 }
741 
742 
743 static struct argname *
combine(struct argname * name)744 combine (struct argname *name)
745 {
746   struct argname *last_str = NULL;
747   for (struct argname *runp = name; runp != NULL; runp = runp->next)
748     {
749       if (runp->type == string)
750 	{
751 	  if (last_str == NULL)
752 	    last_str = runp;
753 	  else
754 	    {
755 	      last_str->str = xrealloc (last_str->str,
756 					strlen (last_str->str)
757 					+ strlen (runp->str) + 1);
758 	      strcat (last_str->str, runp->str);
759 	      last_str->next = runp->next;
760 	    }
761 	}
762       else
763 	last_str = NULL;
764     }
765   return name;
766 }
767 
768 
769 #define obstack_grow_str(ob, str) obstack_grow (ob, str, strlen (str))
770 
771 
772 static void
fillin_arg(struct bitvalue * bytes,struct argname * name,struct instruction * instr,int n)773 fillin_arg (struct bitvalue *bytes, struct argname *name,
774 	    struct instruction *instr, int n)
775 {
776   static struct obstack ob;
777   static int initialized;
778   if (! initialized)
779     {
780       initialized = 1;
781       obstack_init (&ob);
782     }
783 
784   struct argname *runp = name;
785   int cnt = 0;
786   while (runp != NULL)
787     {
788       /* We ignore strings in the function name.  */
789       if (runp->type == string)
790 	{
791 	  if (instr->operands[n].str != NULL)
792 	    error (EXIT_FAILURE, 0,
793 		   "%d: cannot have more than one string parameter",
794 		   i386_lineno - 1);
795 
796 	  instr->operands[n].str = runp->str;
797 	}
798       else
799 	{
800 	  assert (runp->type == nfield);
801 
802 	  /* Construct the function name.  */
803 	  if (cnt++ > 0)
804 	    obstack_1grow (&ob, '$');
805 
806 	  if (runp->field == NULL)
807 	    /* Add some string which contains invalid characters.  */
808 	    obstack_grow_str (&ob, "!!!INVALID!!!");
809 	  else
810 	    {
811 	      char *fieldname = runp->field->name;
812 
813 	      struct synonym search = { .from = fieldname };
814 
815 	      struct synonym **res = tfind (&search, &synonyms, compare_syn);
816 	      if (res != NULL)
817 		fieldname = (*res)->to;
818 
819 	      obstack_grow_str (&ob, fieldname);
820 	    }
821 
822 	  /* Now compute the bit offset of the field.  */
823 	  struct bitvalue *b = bytes;
824 	  int bitoff = 0;
825 	  if (runp->field != NULL)
826 	    while (b != NULL)
827 	      {
828 		if (b->type == field && b->field != NULL)
829 		  {
830 		    if (strcmp (b->field->name, runp->field->name) == 0)
831 		      break;
832 		    bitoff += b->field->bits;
833 		  }
834 		else
835 		  ++bitoff;
836 
837 		b = b->next;
838 	      }
839 	  if (instr->operands[n].off1 == 0)
840 	    instr->operands[n].off1 = bitoff;
841 	  else if (instr->operands[n].off2 == 0)
842 	    instr->operands[n].off2 = bitoff;
843 	  else if (instr->operands[n].off3 == 0)
844 	    instr->operands[n].off3 = bitoff;
845 	  else
846 	    error (EXIT_FAILURE, 0,
847 		   "%d: cannot have more than three fields in parameter",
848 		   i386_lineno - 1);
849 
850 	  if  (runp->field != NULL
851 	       && strncasecmp (runp->field->name, "mod", 3) == 0)
852 	    instr->modrm = 1;
853 	}
854 
855       runp = runp->next;
856     }
857   if (obstack_object_size (&ob) == 0)
858     obstack_grow_str (&ob, "string");
859   obstack_1grow (&ob, '\0');
860   char *fct = obstack_finish (&ob);
861 
862   instr->operands[n].fct = fct;
863 }
864 
865 
866 #if 0
867 static void
868 nameout (const void *nodep, VISIT value, int level)
869 {
870   if (value == leaf || value == postorder)
871     printf ("  %s\n", *(const char **) nodep);
872 }
873 #endif
874 
875 
876 static int
compare_argstring(const void * p1,const void * p2)877 compare_argstring (const void *p1, const void *p2)
878 {
879   const struct argstring *a1 = (const struct argstring *) p1;
880   const struct argstring *a2 = (const struct argstring *) p2;
881 
882   return strcmp (a1->str, a2->str);
883 }
884 
885 
886 static int maxoff[3][3];
887 static int minoff[3][3] = { { 1000, 1000, 1000 },
888 			    { 1000, 1000, 1000 },
889 			    { 1000, 1000, 1000 } };
890 static int nbitoff[3][3];
891 static void *fct_names[3];
892 static int nbitfct[3];
893 static int nbitsuf;
894 static void *strs[3];
895 static int nbitstr[3];
896 static int total_bits = 2;	// Already counted the rep/repe bits.
897 
898 static void
find_numbers(void)899 find_numbers (void)
900 {
901   int nfct_names[3] = { 0, 0, 0 };
902   int nstrs[3] = { 0, 0, 0 };
903 
904   /* We reverse the order of the instruction list while processing it.
905      Later phases need it in the order in which the input file has
906      them.  */
907   struct instruction *reversed = NULL;
908 
909   struct instruction *runp = instructions;
910   while (runp != NULL)
911     {
912       for (int i = 0; i < 3; ++i)
913 	if (runp->operands[i].fct != NULL)
914 	  {
915 	    struct argstring search = { .str = runp->operands[i].fct };
916 	    if (tfind (&search, &fct_names[i], compare_argstring) == NULL)
917 	      {
918 		struct argstring *newp = xmalloc (sizeof (*newp));
919 		newp->str = runp->operands[i].fct;
920 		newp->idx = 0;
921 		if (tsearch (newp, &fct_names[i], compare_argstring) == NULL)
922 		  error (EXIT_FAILURE, errno, "tsearch");
923 		++nfct_names[i];
924 	      }
925 
926 	    if (runp->operands[i].str != NULL)
927 	      {
928 		search.str = runp->operands[i].str;
929 		if (tfind (&search, &strs[i], compare_argstring) == NULL)
930 		  {
931 		    struct argstring *newp = xmalloc (sizeof (*newp));
932 		    newp->str = runp->operands[i].str;
933 		    newp->idx = 0;
934 		    if (tsearch (newp, &strs[i], compare_argstring) == NULL)
935 		      error (EXIT_FAILURE, errno, "tsearch");
936 		    ++nstrs[i];
937 		  }
938 	      }
939 
940 	    maxoff[i][0] = MAX (maxoff[i][0], runp->operands[i].off1);
941 	    maxoff[i][1] = MAX (maxoff[i][1], runp->operands[i].off2);
942 	    maxoff[i][2] = MAX (maxoff[i][2], runp->operands[i].off3);
943 
944 	    if (runp->operands[i].off1 > 0)
945 	      minoff[i][0] = MIN (minoff[i][0], runp->operands[i].off1);
946 	    if (runp->operands[i].off2 > 0)
947 	      minoff[i][1] = MIN (minoff[i][1], runp->operands[i].off2);
948 	    if (runp->operands[i].off3 > 0)
949 	      minoff[i][2] = MIN (minoff[i][2], runp->operands[i].off3);
950 	  }
951 
952       struct instruction *old = runp;
953       runp = runp->next;
954 
955       old->next = reversed;
956       reversed = old;
957     }
958   instructions = reversed;
959 
960   int d;
961   int c;
962   for (int i = 0; i < 3; ++i)
963     {
964       // printf ("min1 = %d, min2 = %d, min3 = %d\n", minoff[i][0], minoff[i][1], minoff[i][2]);
965       // printf ("max1 = %d, max2 = %d, max3 = %d\n", maxoff[i][0], maxoff[i][1], maxoff[i][2]);
966 
967       if (minoff[i][0] == 1000)
968 	nbitoff[i][0] = 0;
969       else
970 	{
971 	  nbitoff[i][0] = 1;
972 	  d = maxoff[i][0] - minoff[i][0];
973 	  c = 1;
974 	  while (c < d)
975 	    {
976 	      ++nbitoff[i][0];
977 	      c *= 2;
978 	    }
979 	  total_bits += nbitoff[i][0];
980 	}
981 
982       if (minoff[i][1] == 1000)
983 	nbitoff[i][1] = 0;
984       else
985 	{
986 	  nbitoff[i][1] = 1;
987 	  d = maxoff[i][1] - minoff[i][1];
988 	  c = 1;
989 	  while (c < d)
990 	    {
991 	      ++nbitoff[i][1];
992 	      c *= 2;
993 	    }
994 	  total_bits += nbitoff[i][1];
995 	}
996 
997       if (minoff[i][2] == 1000)
998 	nbitoff[i][2] = 0;
999       else
1000 	{
1001 	  nbitoff[i][2] = 1;
1002 	  d = maxoff[i][2] - minoff[i][2];
1003 	  c = 1;
1004 	  while (c < d)
1005 	    {
1006 	      ++nbitoff[i][2];
1007 	      c *= 2;
1008 	    }
1009 	  total_bits += nbitoff[i][2];
1010 	}
1011       // printf ("off1 = %d, off2 = %d, off3 = %d\n", nbitoff[i][0], nbitoff[i][1], nbitoff[i][2]);
1012 
1013       nbitfct[i] = 1;
1014       d = nfct_names[i];
1015       c = 1;
1016       while (c < d)
1017 	{
1018 	  ++nbitfct[i];
1019 	  c *= 2;
1020 	}
1021       total_bits += nbitfct[i];
1022       // printf ("%d fct[%d], %d bits\n", nfct_names[i], i, nbitfct[i]);
1023 
1024       if (nstrs[i] != 0)
1025 	{
1026 	  nbitstr[i] = 1;
1027 	  d = nstrs[i];
1028 	  c = 1;
1029 	  while (c < d)
1030 	    {
1031 	      ++nbitstr[i];
1032 	      c *= 2;
1033 	    }
1034 	  total_bits += nbitstr[i];
1035 	}
1036 
1037       // twalk (fct_names[i], nameout);
1038     }
1039 
1040   nbitsuf = 0;
1041   d = nsuffixes;
1042   c = 1;
1043   while (c < d)
1044     {
1045       ++nbitsuf;
1046       c *= 2;
1047     }
1048   total_bits += nbitsuf;
1049   // printf ("%d suffixes, %d bits\n", nsuffixes, nbitsuf);
1050 }
1051 
1052 
1053 static int
compare_syn(const void * p1,const void * p2)1054 compare_syn (const void *p1, const void *p2)
1055 {
1056   const struct synonym *s1 = (const struct synonym *) p1;
1057   const struct synonym *s2 = (const struct synonym *) p2;
1058 
1059   return strcmp (s1->from, s2->from);
1060 }
1061 
1062 
1063 static int
compare_suf(const void * p1,const void * p2)1064 compare_suf (const void *p1, const void *p2)
1065 {
1066   const struct suffix *s1 = (const struct suffix *) p1;
1067   const struct suffix *s2 = (const struct suffix *) p2;
1068 
1069   return strcmp (s1->name, s2->name);
1070 }
1071 
1072 
1073 static int count_op_str;
1074 static int off_op_str;
1075 static void
print_op_str(const void * nodep,VISIT value,int level)1076 print_op_str (const void *nodep, VISIT value,
1077 	      int level __attribute__ ((unused)))
1078 {
1079   if (value == leaf || value == postorder)
1080     {
1081       const char *str = (*(struct argstring **) nodep)->str;
1082       fprintf (outfile, "%s\n  \"%s",
1083 	       count_op_str == 0 ? "" : "\\0\"", str);
1084       (*(struct argstring **) nodep)->idx = ++count_op_str;
1085       (*(struct argstring **) nodep)->off = off_op_str;
1086       off_op_str += strlen (str) + 1;
1087     }
1088 }
1089 
1090 
1091 static void
print_op_str_idx(const void * nodep,VISIT value,int level)1092 print_op_str_idx (const void *nodep, VISIT value,
1093 		  int level __attribute__ ((unused)))
1094 {
1095   if (value == leaf || value == postorder)
1096     printf ("  %d,\n", (*(struct argstring **) nodep)->off);
1097 }
1098 
1099 
1100 static void
print_op_fct(const void * nodep,VISIT value,int level)1101 print_op_fct (const void *nodep, VISIT value,
1102 	      int level __attribute__ ((unused)))
1103 {
1104   if (value == leaf || value == postorder)
1105     {
1106       fprintf (outfile, "  FCT_%s,\n", (*(struct argstring **) nodep)->str);
1107       (*(struct argstring **) nodep)->idx = ++count_op_str;
1108     }
1109 }
1110 
1111 
1112 #if NMNES < 2
1113 # error "bogus NMNES value"
1114 #endif
1115 
1116 static void
instrtable_out(void)1117 instrtable_out (void)
1118 {
1119   find_numbers ();
1120 
1121 #if 0
1122   create_mnemonic_table ();
1123 
1124   fprintf (outfile, "#define MNEMONIC_BITS %zu\n", best_mnemonic_bits);
1125 #else
1126   fprintf (outfile, "#define MNEMONIC_BITS %ld\n",
1127 	   lrint (ceil (log2 (NMNES))));
1128 #endif
1129   fprintf (outfile, "#define SUFFIX_BITS %d\n", nbitsuf);
1130   for (int i = 0; i < 3; ++i)
1131     {
1132       fprintf (outfile, "#define FCT%d_BITS %d\n", i + 1, nbitfct[i]);
1133       if (nbitstr[i] != 0)
1134 	fprintf (outfile, "#define STR%d_BITS %d\n", i + 1, nbitstr[i]);
1135       fprintf (outfile, "#define OFF%d_1_BITS %d\n", i + 1, nbitoff[i][0]);
1136       fprintf (outfile, "#define OFF%d_1_BIAS %d\n", i + 1, minoff[i][0]);
1137       if (nbitoff[i][1] != 0)
1138 	{
1139 	  fprintf (outfile, "#define OFF%d_2_BITS %d\n", i + 1, nbitoff[i][1]);
1140 	  fprintf (outfile, "#define OFF%d_2_BIAS %d\n", i + 1, minoff[i][1]);
1141 	}
1142       if (nbitoff[i][2] != 0)
1143 	{
1144 	  fprintf (outfile, "#define OFF%d_3_BITS %d\n", i + 1, nbitoff[i][2]);
1145 	  fprintf (outfile, "#define OFF%d_3_BIAS %d\n", i + 1, minoff[i][2]);
1146 	}
1147     }
1148 
1149   fputs ("\n#include <i386_data.h>\n\n", outfile);
1150 
1151 
1152 #define APPEND(a, b) APPEND_ (a, b)
1153 #define APPEND_(a, b) a##b
1154 #define EMIT_SUFFIX(suf) \
1155   fprintf (outfile, "#define suffix_%s %d\n", #suf, APPEND (suffix_, suf))
1156   EMIT_SUFFIX (none);
1157   EMIT_SUFFIX (w);
1158   EMIT_SUFFIX (w0);
1159   EMIT_SUFFIX (W);
1160   EMIT_SUFFIX (tttn);
1161   EMIT_SUFFIX (D);
1162   EMIT_SUFFIX (w1);
1163   EMIT_SUFFIX (W1);
1164 
1165   fputc_unlocked ('\n', outfile);
1166 
1167   for (int i = 0; i < 3; ++i)
1168     {
1169       /* Functions.  */
1170       count_op_str = 0;
1171       fprintf (outfile, "static const opfct_t op%d_fct[] =\n{\n  NULL,\n",
1172 	       i + 1);
1173       twalk (fct_names[i], print_op_fct);
1174       fputs ("};\n", outfile);
1175 
1176       /* The operand strings.  */
1177       if (nbitstr[i] != 0)
1178 	{
1179 	  count_op_str = 0;
1180 	  off_op_str = 0;
1181 	  fprintf (outfile, "static const char op%d_str[] =", i + 1);
1182 	  twalk (strs[i], print_op_str);
1183 	  fputs ("\";\n", outfile);
1184 
1185 	  fprintf (outfile, "static const uint8_t op%d_str_idx[] = {\n",
1186 		   i + 1);
1187 	  twalk (strs[i], print_op_str_idx);
1188 	  fputs ("};\n", outfile);
1189 	}
1190     }
1191 
1192 
1193   fputs ("static const struct instr_enc instrtab[] =\n{\n", outfile);
1194   struct instruction *instr;
1195   for (instr = instructions; instr != NULL; instr = instr->next)
1196     {
1197       fputs ("  {", outfile);
1198       if (instr->mnemonic == (void *) -1l)
1199 	fputs (" .mnemonic = MNE_INVALID,", outfile);
1200       else
1201 	fprintf (outfile, " .mnemonic = MNE_%s,", instr->mnemonic);
1202       fprintf (outfile, " .rep = %d,", instr->rep);
1203       fprintf (outfile, " .repe = %d,", instr->repe);
1204       fprintf (outfile, " .suffix = %d,", instr->suffix);
1205       fprintf (outfile, " .modrm = %d,", instr->modrm);
1206 
1207       for (int i = 0; i < 3; ++i)
1208 	{
1209 	  int idx = 0;
1210 	  if (instr->operands[i].fct != NULL)
1211 	    {
1212 	      struct argstring search = { .str = instr->operands[i].fct };
1213 	      struct argstring **res = tfind (&search, &fct_names[i],
1214 					      compare_argstring);
1215 	      assert (res != NULL);
1216 	      idx = (*res)->idx;
1217 	    }
1218 	  fprintf (outfile, " .fct%d = %d,", i + 1, idx);
1219 
1220 	  idx = 0;
1221 	  if (instr->operands[i].str != NULL)
1222 	    {
1223 	      struct argstring search = { .str = instr->operands[i].str };
1224 	      struct argstring **res = tfind (&search, &strs[i],
1225 					      compare_argstring);
1226 	      assert (res != NULL);
1227 	      idx = (*res)->idx;
1228 	    }
1229 	  if (nbitstr[i] != 0)
1230 	    fprintf (outfile, " .str%d = %d,", i + 1, idx);
1231 
1232 	  fprintf (outfile, " .off%d_1 = %d,", i + 1,
1233 		   MAX (0, instr->operands[i].off1 - minoff[i][0]));
1234 
1235 	  if (nbitoff[i][1] != 0)
1236 	    fprintf (outfile, " .off%d_2 = %d,", i + 1,
1237 		     MAX (0, instr->operands[i].off2 - minoff[i][1]));
1238 
1239 	  if (nbitoff[i][2] != 0)
1240 	    fprintf (outfile, " .off%d_3 = %d,", i + 1,
1241 		     MAX (0, instr->operands[i].off3 - minoff[i][2]));
1242 	}
1243 
1244       fputs (" },\n", outfile);
1245     }
1246   fputs ("};\n", outfile);
1247 
1248   fputs ("static const uint8_t match_data[] =\n{\n", outfile);
1249   size_t cnt = 0;
1250   for (instr = instructions; instr != NULL; instr = instr->next, ++cnt)
1251     {
1252       /* First count the number of bytes.  */
1253       size_t totalbits = 0;
1254       size_t zerobits = 0;
1255       bool leading_p = true;
1256       size_t leadingbits = 0;
1257       struct bitvalue *b = instr->bytes;
1258       while (b != NULL)
1259 	{
1260 	  if (b->type == zeroone)
1261 	    {
1262 	      ++totalbits;
1263 	      zerobits = 0;
1264 	      if (leading_p)
1265 		++leadingbits;
1266 	    }
1267 	  else
1268 	    {
1269 	      totalbits += b->field->bits;
1270 	      /* We must always count the mod/rm byte.  */
1271 	      if (strncasecmp (b->field->name, "mod", 3) == 0)
1272 		zerobits = 0;
1273 	      else
1274 		zerobits += b->field->bits;
1275 	      leading_p = false;
1276 	    }
1277 	  b = b->next;
1278 	}
1279       size_t nbytes = (totalbits - zerobits + 7) / 8;
1280       assert (nbytes > 0);
1281       size_t leadingbytes = leadingbits / 8;
1282 
1283       fprintf (outfile, "  %#zx,", nbytes | (leadingbytes << 4));
1284 
1285       /* Now create the mask and byte values.  */
1286       uint8_t byte = 0;
1287       uint8_t mask = 0;
1288       int nbits = 0;
1289       b = instr->bytes;
1290       while (b != NULL)
1291 	{
1292 	  if (b->type == zeroone)
1293 	    {
1294 	      byte = (byte << 1) | b->value;
1295 	      mask = (mask << 1) | 1;
1296 	      if (++nbits == 8)
1297 		{
1298 		  if (leadingbytes > 0)
1299 		    {
1300 		      assert (mask == 0xff);
1301 		      fprintf (outfile, " %#" PRIx8 ",", byte);
1302 		      --leadingbytes;
1303 		    }
1304 		  else
1305 		    fprintf (outfile, " %#" PRIx8 ", %#" PRIx8 ",",
1306 			     mask, byte);
1307 		  byte = mask = nbits = 0;
1308 		  if (--nbytes == 0)
1309 		    break;
1310 		}
1311 	    }
1312 	  else
1313 	    {
1314 	      assert (leadingbytes == 0);
1315 
1316 	      unsigned long int remaining = b->field->bits;
1317 	      while (nbits + remaining > 8)
1318 		{
1319 		  fprintf (outfile, " %#" PRIx8 ", %#" PRIx8 ",",
1320 			   mask << (8 - nbits), byte << (8 - nbits));
1321 		  remaining = nbits + remaining - 8;
1322 		  byte = mask = nbits = 0;
1323 		  if (--nbytes == 0)
1324 		    break;
1325 		}
1326 	      byte <<= remaining;
1327 	      mask <<= remaining;
1328 	      nbits += remaining;
1329 	      if (nbits == 8)
1330 		{
1331 		  fprintf (outfile, " %#" PRIx8 ", %#" PRIx8 ",", mask, byte);
1332 		  byte = mask = nbits = 0;
1333 		  if (--nbytes == 0)
1334 		    break;
1335 		}
1336 	    }
1337 	  b = b->next;
1338 	}
1339 
1340       fputc_unlocked ('\n', outfile);
1341     }
1342   fputs ("};\n", outfile);
1343 }
1344 
1345 
1346 #if 0
1347 static size_t mnemonic_maxlen;
1348 static size_t mnemonic_minlen;
1349 static size_t
1350 which_chars (const char *str[], size_t nstr)
1351 {
1352   char used_char[256];
1353   memset (used_char, '\0', sizeof (used_char));
1354   mnemonic_maxlen = 0;
1355   mnemonic_minlen = 10000;
1356   for (size_t cnt = 0; cnt < nstr; ++cnt)
1357     {
1358       const unsigned char *cp = (const unsigned char *) str[cnt];
1359       mnemonic_maxlen = MAX (mnemonic_maxlen, strlen ((char *) cp));
1360       mnemonic_minlen = MIN (mnemonic_minlen, strlen ((char *) cp));
1361       do
1362         used_char[*cp++] = 1;
1363       while (*cp != '\0');
1364     }
1365   size_t nused_char = 0;
1366   for (size_t cnt = 0; cnt < 256; ++cnt)
1367     if (used_char[cnt] != 0)
1368       ++nused_char;
1369   return nused_char;
1370 }
1371 
1372 
1373 static const char **mnemonic_strs;
1374 static size_t nmnemonic_strs;
1375 static void
1376 add_mnemonics (const void *nodep, VISIT value,
1377 	       int level __attribute__ ((unused)))
1378 {
1379   if (value == leaf || value == postorder)
1380     mnemonic_strs[nmnemonic_strs++] = *(const char **) nodep;
1381 }
1382 
1383 
1384 struct charfreq
1385 {
1386   char ch;
1387   int freq;
1388 };
1389 static struct charfreq pfxfreq[256];
1390 static struct charfreq sfxfreq[256];
1391 
1392 
1393 static int
1394 compare_freq (const void *p1, const void *p2)
1395 {
1396   const struct charfreq *c1 = (const struct charfreq *) p1;
1397   const struct charfreq *c2 = (const struct charfreq *) p2;
1398 
1399   if (c1->freq > c2->freq)
1400     return -1;
1401   if (c1->freq < c2->freq)
1402     return 1;
1403   return 0;
1404 }
1405 
1406 
1407 static size_t
1408 compute_pfxfreq (const char *str[], size_t nstr)
1409 {
1410   memset (pfxfreq, '\0', sizeof (pfxfreq));
1411 
1412   for (size_t i = 0; i < nstr; ++i)
1413     pfxfreq[i].ch = i;
1414 
1415   for (size_t i = 0; i < nstr; ++i)
1416     ++pfxfreq[*((const unsigned char *) str[i])].freq;
1417 
1418   qsort (pfxfreq, 256, sizeof (struct charfreq), compare_freq);
1419 
1420   size_t n = 0;
1421   while (n < 256 && pfxfreq[n].freq != 0)
1422     ++n;
1423   return n;
1424 }
1425 
1426 
1427 struct strsnlen
1428 {
1429   const char *str;
1430   size_t len;
1431 };
1432 
1433 static size_t
1434 compute_sfxfreq (size_t nstr, struct strsnlen *strsnlen)
1435 {
1436   memset (sfxfreq, '\0', sizeof (sfxfreq));
1437 
1438   for (size_t i = 0; i < nstr; ++i)
1439     sfxfreq[i].ch = i;
1440 
1441   for (size_t i = 0; i < nstr; ++i)
1442     ++sfxfreq[((const unsigned char *) strchrnul (strsnlen[i].str, '\0'))[-1]].freq;
1443 
1444   qsort (sfxfreq, 256, sizeof (struct charfreq), compare_freq);
1445 
1446   size_t n = 0;
1447   while (n < 256 && sfxfreq[n].freq != 0)
1448     ++n;
1449   return n;
1450 }
1451 
1452 
1453 static void
1454 create_mnemonic_table (void)
1455 {
1456   mnemonic_strs = xmalloc (nmnemonics * sizeof (char *));
1457 
1458   twalk (mnemonics, add_mnemonics);
1459 
1460   (void) which_chars (mnemonic_strs, nmnemonic_strs);
1461 
1462   size_t best_so_far = 100000000;
1463   char *best_prefix = NULL;
1464   char *best_suffix = NULL;
1465   char *best_table = NULL;
1466   size_t best_table_size = 0;
1467   size_t best_table_bits = 0;
1468   size_t best_prefix_bits = 0;
1469 
1470   /* We can precompute the prefix characters.  */
1471   size_t npfx_char = compute_pfxfreq (mnemonic_strs, nmnemonic_strs);
1472 
1473   /* Compute best size for string representation including explicit NUL.  */
1474   for (size_t pfxbits = 0; (1u << pfxbits) < 2 * npfx_char; ++pfxbits)
1475     {
1476       char prefix[1 << pfxbits];
1477       size_t i;
1478       for (i = 0; i < (1u << pfxbits) - 1; ++i)
1479 	prefix[i] = pfxfreq[i].ch;
1480       prefix[i] = '\0';
1481 
1482       struct strsnlen strsnlen[nmnemonic_strs];
1483 
1484       for (i = 0; i < nmnemonic_strs; ++i)
1485 	{
1486 	  if (strchr (prefix, *mnemonic_strs[i]) != NULL)
1487 	    strsnlen[i].str = mnemonic_strs[i] + 1;
1488 	  else
1489 	    strsnlen[i].str = mnemonic_strs[i];
1490 	  strsnlen[i].len = strlen (strsnlen[i].str);
1491 	}
1492 
1493       /* With the prefixes gone, try to combine strings.  */
1494       size_t nstrsnlen = 1;
1495       for (i = 1; i < nmnemonic_strs; ++i)
1496 	{
1497 	  size_t j;
1498 	  for (j = 0; j < nstrsnlen; ++j)
1499 	    if (strsnlen[i].len > strsnlen[j].len
1500 		&& strcmp (strsnlen[j].str,
1501 			   strsnlen[i].str + (strsnlen[i].len
1502 					      - strsnlen[j].len)) == 0)
1503 	      {
1504 		strsnlen[j] = strsnlen[i];
1505 		break;
1506 	      }
1507 	    else if (strsnlen[i].len < strsnlen[j].len
1508 		     && strcmp (strsnlen[i].str,
1509 				strsnlen[j].str + (strsnlen[j].len
1510 						   - strsnlen[i].len)) == 0)
1511 	      break;
1512 ;
1513 	  if (j == nstrsnlen)
1514 	      strsnlen[nstrsnlen++] = strsnlen[i];
1515 	}
1516 
1517       size_t nsfx_char = compute_sfxfreq (nstrsnlen, strsnlen);
1518 
1519       for (size_t sfxbits = 0; (1u << sfxbits) < 2 * nsfx_char; ++sfxbits)
1520 	{
1521 	  char suffix[1 << sfxbits];
1522 
1523 	  for (i = 0; i < (1u << sfxbits) - 1; ++i)
1524 	    suffix[i] = sfxfreq[i].ch;
1525 	  suffix[i] = '\0';
1526 
1527 	  size_t newlen[nstrsnlen];
1528 
1529 	  for (i = 0; i < nstrsnlen; ++i)
1530 	    if (strchr (suffix, strsnlen[i].str[strsnlen[i].len - 1]) != NULL)
1531 	      newlen[i] = strsnlen[i].len - 1;
1532 	    else
1533 	      newlen[i] = strsnlen[i].len;
1534 
1535 	  char charused[256];
1536 	  memset (charused, '\0', sizeof (charused));
1537 	  size_t ncharused = 0;
1538 
1539 	  const char *tablestr[nstrsnlen];
1540 	  size_t ntablestr = 1;
1541 	  tablestr[0] = strsnlen[0].str;
1542 	  size_t table = newlen[0] + 1;
1543 	  for (i = 1; i < nstrsnlen; ++i)
1544 	    {
1545 	      size_t j;
1546 	      for (j = 0; j < ntablestr; ++j)
1547 		if (newlen[i] > newlen[j]
1548 		    && memcmp (tablestr[j],
1549 			       strsnlen[i].str + (newlen[i] - newlen[j]),
1550 			       newlen[j]) == 0)
1551 		  {
1552 		    table += newlen[i] - newlen[j];
1553 		    tablestr[j] = strsnlen[i].str;
1554 		    newlen[j] = newlen[i];
1555 		    break;
1556 		  }
1557 		else if (newlen[i] < newlen[j]
1558 		     && memcmp (strsnlen[i].str,
1559 				tablestr[j] + (newlen[j] - newlen[i]),
1560 				newlen[i]) == 0)
1561 		  break;
1562 
1563 	      if (j == ntablestr)
1564 		{
1565 		  table += newlen[i] + 1;
1566 		  tablestr[ntablestr] = strsnlen[i].str;
1567 		  newlen[ntablestr] = newlen[i];
1568 
1569 		  ++ntablestr;
1570 		}
1571 
1572 	      for (size_t x = 0; x < newlen[j]; ++x)
1573 		if (charused[((const unsigned char *) tablestr[j])[x]]++ == 0)
1574 		  ++ncharused;
1575 	    }
1576 
1577 	  size_t ncharused_bits = 0;
1578 	  i = 1;
1579 	  while (i < ncharused)
1580 	    {
1581 	      i *= 2;
1582 	      ++ncharused_bits;
1583 	    }
1584 
1585 	  size_t table_bits = 0;
1586 	  i = 1;
1587 	  while (i < table)
1588 	    {
1589 	      i *= 2;
1590 	      ++table_bits;
1591 	    }
1592 
1593 	  size_t mnemonic_bits = table_bits + pfxbits + sfxbits;
1594 	  size_t new_total = (((table + 7) / 8) * ncharused_bits + ncharused
1595 			      + (pfxbits == 0 ? 0 : (1 << pfxbits) - 1)
1596 			      + (sfxbits == 0 ? 0 : (1 << sfxbits) - 1)
1597 			      + (((total_bits + mnemonic_bits + 7) / 8)
1598 				 * ninstructions));
1599 
1600 	  if (new_total < best_so_far)
1601 	    {
1602 	      best_so_far = new_total;
1603 	      best_mnemonic_bits = mnemonic_bits;
1604 
1605 	      free (best_suffix);
1606 	      best_suffix = xstrdup (suffix);
1607 
1608 	      free (best_prefix);
1609 	      best_prefix = xstrdup (prefix);
1610 	      best_prefix_bits = pfxbits;
1611 
1612 	      best_table_size = table;
1613 	      best_table_bits = table_bits;
1614 	      char *cp = best_table = xrealloc (best_table, table);
1615 	      for (i = 0; i < ntablestr; ++i)
1616 		{
1617 		  assert (cp + newlen[i] + 1 <= best_table + table);
1618 		  cp = mempcpy (cp, tablestr[i], newlen[i]);
1619 		  *cp++ = '\0';
1620 		}
1621 	      assert (cp == best_table + table);
1622 	    }
1623 	}
1624     }
1625 
1626   fputs ("static const char mnemonic_table[] =\n\"", outfile);
1627   for (size_t i = 0; i < best_table_size; ++i)
1628     {
1629       if (((i + 1) % 60) == 0)
1630 	fputs ("\"\n\"", outfile);
1631       if (!isascii (best_table[i]) || !isprint (best_table[i]))
1632 	fprintf (outfile, "\\%03o", best_table[i]);
1633       else
1634 	fputc (best_table[i], outfile);
1635     }
1636   fputs ("\";\n", outfile);
1637 
1638   if (best_prefix[0] != '\0')
1639     fprintf (outfile,
1640 	     "static const char prefix[%zu] = \"%s\";\n"
1641 	     "#define PREFIXCHAR_BITS %zu\n",
1642 	     strlen (best_prefix), best_prefix, best_prefix_bits);
1643   else
1644     fputs ("#define NO_PREFIX\n", outfile);
1645 
1646   if (best_suffix[0] != '\0')
1647     fprintf (outfile, "static const char suffix[%zu] = \"%s\";\n",
1648 	     strlen (best_suffix), best_suffix);
1649   else
1650     fputs ("#define NO_SUFFIX\n", outfile);
1651 
1652   for (size_t i = 0; i < nmnemonic_strs; ++i)
1653     {
1654       const char *mne = mnemonic_strs[i];
1655 
1656       size_t pfxval = 0;
1657       char *cp = strchr (best_prefix, *mne);
1658       if (cp != NULL)
1659 	{
1660 	  pfxval = 1 + (cp - best_prefix);
1661 	  ++mne;
1662 	}
1663 
1664       size_t l = strlen (mne);
1665 
1666       size_t sfxval = 0;
1667       cp = strchr (best_suffix, mne[l - 1]);
1668       if (cp != NULL)
1669 	{
1670 	  sfxval = 1 + (cp - best_suffix);
1671 	  --l;
1672 	}
1673 
1674       char *off = memmem (best_table, best_table_size, mne, l);
1675       while (off[l] != '\0')
1676 	{
1677 	  off = memmem (off + 1, best_table_size, mne, l);
1678 	  assert (off != NULL);
1679 	}
1680 
1681       fprintf (outfile, "#define MNE_%s %#zx\n",
1682 	       mnemonic_strs[i],
1683 	       (off - best_table)
1684 	       + ((pfxval + (sfxval << best_prefix_bits)) << best_table_bits));
1685     }
1686 }
1687 #endif
1688