aboutsummaryrefslogtreecommitdiffstats
path: root/riscV/ExpansionOracle.ml
blob: 6eb8227488c65aba61cefe867d79a68454c1a445 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
(* *************************************************************)
(*                                                             *)
(*             The Compcert verified compiler                  *)
(*                                                             *)
(*           Léo Gourdin        UGA, VERIMAG                   *)
(*                                                             *)
(*  Copyright VERIMAG. All rights reserved.                    *)
(*  This file is distributed under the terms of the INRIA      *)
(*  Non-Commercial License Agreement.                          *)
(*                                                             *)
(* *************************************************************)

open RTLpathLivegenaux
open RTLpathCommon
open Datatypes
open Maps
open RTL
open Op
open Asmgen
open DebugPrint
open RTLpath
open! Integers
open Camlcoq
open Option

type sop = Sop of operation * P.t list

type sval = Si of RTL.instruction | Sr of P.t

let reg = ref 1

let node = ref 1

let p2i r = P.to_int r

let r2p () = P.of_int !reg

let n2p () = P.of_int !node

let r2pi () =
  reg := !reg + 1;
  r2p ()

let n2pi () =
  node := !node + 1;
  n2p ()

type immt =
  | Addiw
  | Addil
  | Andiw
  | Andil
  | Oriw
  | Oril
  | Xoriw
  | Xoril
  | Sltiw
  | Sltiuw
  | Sltil
  | Sltiul

let find_or_addnmove op args rd succ map_consts not_final =
  let sop = Sop (op, args) in
  match Hashtbl.find_opt map_consts sop with
  | Some r ->
      if not_final then node := !node - 1;
      Sr (P.of_int r)
  | None ->
      if not (List.exists (fun a -> a = rd) args) && not_final then
        Hashtbl.add map_consts sop (p2i rd);
      Si (Iop (op, args, rd, succ))

let build_head_tuple head sv =
  match sv with Si i -> (head @ [ i ], None) | Sr r -> (head, Some r)

let unzip_head_tuple ht r = match ht with l, Some r' -> r' | l, None -> r

let unzip_head_tuple_move ht r succ =
  match ht with
  | l, Some r' ->
      if r' != r then [ Iop (Omove, [ r' ], r, succ) ] else [ Inop succ ]
  | l, None -> l

let build_full_ilist op args dest succ hd k map_consts =
  let sv = find_or_addnmove op args dest succ map_consts false in
  let ht = build_head_tuple hd sv in
  unzip_head_tuple_move ht dest succ @ k

let load_hilo32 dest hi lo succ map_consts not_final =
  let op1 = OEluiw hi in
  if Int.eq lo Int.zero then
    let sv = find_or_addnmove op1 [] dest succ map_consts not_final in
    build_head_tuple [] sv
  else
    let r = r2pi () in
    let sv1 = find_or_addnmove op1 [] r (n2pi ()) map_consts not_final in
    let ht1 = build_head_tuple [] sv1 in
    let r' = unzip_head_tuple ht1 r in
    let op2 = OEaddiw lo in
    let sv2 = find_or_addnmove op2 [ r' ] dest succ map_consts not_final in
    build_head_tuple (fst ht1) sv2

let load_hilo64 dest hi lo succ map_consts not_final =
  let op1 = OEluil hi in
  if Int64.eq lo Int64.zero then
    let sv = find_or_addnmove op1 [] dest succ map_consts not_final in
    build_head_tuple [] sv
  else
    let r = r2pi () in
    let sv1 = find_or_addnmove op1 [] r (n2pi ()) map_consts not_final in
    let ht1 = build_head_tuple [] sv1 in
    let r' = unzip_head_tuple ht1 r in
    let op2 = OEaddil lo in
    let sv2 = find_or_addnmove op2 [ r' ] dest succ map_consts not_final in
    build_head_tuple (fst ht1) sv2

let loadimm32 dest n succ map_consts not_final =
  match make_immed32 n with
  | Imm32_single imm ->
      let op1 = OEaddiwr0 imm in
      let sv = find_or_addnmove op1 [] dest succ map_consts not_final in
      build_head_tuple [] sv
  | Imm32_pair (hi, lo) -> load_hilo32 dest hi lo succ map_consts not_final

let loadimm64 dest n succ map_consts not_final =
  match make_immed64 n with
  | Imm64_single imm ->
      let op1 = OEaddilr0 imm in
      let sv = find_or_addnmove op1 [] dest succ map_consts not_final in
      build_head_tuple [] sv
  | Imm64_pair (hi, lo) -> load_hilo64 dest hi lo succ map_consts not_final
  | Imm64_large imm ->
      let op1 = OEloadli imm in
      let sv = find_or_addnmove op1 [] dest succ map_consts not_final in
      build_head_tuple [] sv

let get_opimm imm = function
  | Addiw -> OEaddiw imm
  | Andiw -> OEandiw imm
  | Oriw -> OEoriw imm
  | Xoriw -> OExoriw imm
  | Sltiw -> OEsltiw imm
  | Sltiuw -> OEsltiuw imm
  | Addil -> OEaddil imm
  | Andil -> OEandil imm
  | Oril -> OEoril imm
  | Xoril -> OExoril imm
  | Sltil -> OEsltil imm
  | Sltiul -> OEsltiul imm

let opimm32 a1 dest n succ k op opimm map_consts =
  match make_immed32 n with
  | Imm32_single imm ->
      build_full_ilist (get_opimm imm opimm) [ a1 ] dest succ [] k map_consts
  | Imm32_pair (hi, lo) ->
      let r = r2pi () in
      let ht = load_hilo32 r hi lo (n2pi ()) map_consts true in
      let r' = unzip_head_tuple ht r in
      build_full_ilist op [ a1; r' ] dest succ (fst ht) k map_consts

let opimm64 a1 dest n succ k op opimm map_consts =
  match make_immed64 n with
  | Imm64_single imm ->
      build_full_ilist (get_opimm imm opimm) [ a1 ] dest succ [] k map_consts
  | Imm64_pair (hi, lo) ->
      let r = r2pi () in
      let ht = load_hilo64 r hi lo (n2pi ()) map_consts true in
      let r' = unzip_head_tuple ht r in
      build_full_ilist op [ a1; r' ] dest succ (fst ht) k map_consts
  | Imm64_large imm ->
      let r = r2pi () in
      let op1 = OEloadli imm in
      let inode = n2pi () in
      let sv = find_or_addnmove op1 [] r inode map_consts true in
      let ht = build_head_tuple [] sv in
      let r' = unzip_head_tuple ht r in
      build_full_ilist op [ a1; r' ] dest succ (fst ht) k map_consts

let addimm32 a1 dest n succ k map_consts =
  opimm32 a1 dest n succ k Oadd Addiw map_consts

let andimm32 a1 dest n succ k map_consts =
  opimm32 a1 dest n succ k Oand Andiw map_consts

let orimm32 a1 dest n succ k map_consts =
  opimm32 a1 dest n succ k Oor Oriw map_consts

let xorimm32 a1 dest n succ k map_consts =
  opimm32 a1 dest n succ k Oxor Xoriw map_consts

let sltimm32 a1 dest n succ k map_consts =
  opimm32 a1 dest n succ k (OEsltw None) Sltiw map_consts

let sltuimm32 a1 dest n succ k map_consts =
  opimm32 a1 dest n succ k (OEsltuw None) Sltiuw map_consts

let addimm64 a1 dest n succ k = opimm64 a1 dest n succ k Oaddl Addil

let andimm64 a1 dest n succ k = opimm64 a1 dest n succ k Oandl Andil

let orimm64 a1 dest n succ k = opimm64 a1 dest n succ k Oorl Oril

let xorimm64 a1 dest n succ k = opimm64 a1 dest n succ k Oxorl Xoril

let sltimm64 a1 dest n succ k = opimm64 a1 dest n succ k (OEsltl None) Sltil

let sltuimm64 a1 dest n succ k = opimm64 a1 dest n succ k (OEsltul None) Sltiul

let is_inv_cmp = function Cle | Cgt -> true | _ -> false

let make_optR0 is_x0 is_inv = if is_x0 then Some is_inv else None

let cbranch_int32s is_x0 cmp a1 a2 info succ1 succ2 k =
  let optR0 = make_optR0 is_x0 (is_inv_cmp cmp) in
  match cmp with
  | Ceq -> Icond (CEbeqw optR0, [ a1; a2 ], succ1, succ2, info) :: k
  | Cne -> Icond (CEbnew optR0, [ a1; a2 ], succ1, succ2, info) :: k
  | Clt -> Icond (CEbltw optR0, [ a1; a2 ], succ1, succ2, info) :: k
  | Cle -> Icond (CEbgew optR0, [ a2; a1 ], succ1, succ2, info) :: k
  | Cgt -> Icond (CEbltw optR0, [ a2; a1 ], succ1, succ2, info) :: k
  | Cge -> Icond (CEbgew optR0, [ a1; a2 ], succ1, succ2, info) :: k

let cbranch_int32u is_x0 cmp a1 a2 info succ1 succ2 k =
  let optR0 = make_optR0 is_x0 (is_inv_cmp cmp) in
  match cmp with
  | Ceq -> Icond (CEbequw optR0, [ a1; a2 ], succ1, succ2, info) :: k
  | Cne -> Icond (CEbneuw optR0, [ a1; a2 ], succ1, succ2, info) :: k
  | Clt -> Icond (CEbltuw optR0, [ a1; a2 ], succ1, succ2, info) :: k
  | Cle -> Icond (CEbgeuw optR0, [ a2; a1 ], succ1, succ2, info) :: k
  | Cgt -> Icond (CEbltuw optR0, [ a2; a1 ], succ1, succ2, info) :: k
  | Cge -> Icond (CEbgeuw optR0, [ a1; a2 ], succ1, succ2, info) :: k

let cbranch_int64s is_x0 cmp a1 a2 info succ1 succ2 k =
  let optR0 = make_optR0 is_x0 (is_inv_cmp cmp) in
  match cmp with
  | Ceq -> Icond (CEbeql optR0, [ a1; a2 ], succ1, succ2, info) :: k
  | Cne -> Icond (CEbnel optR0, [ a1; a2 ], succ1, succ2, info) :: k
  | Clt -> Icond (CEbltl optR0, [ a1; a2 ], succ1, succ2, info) :: k
  | Cle -> Icond (CEbgel optR0, [ a2; a1 ], succ1, succ2, info) :: k
  | Cgt -> Icond (CEbltl optR0, [ a2; a1 ], succ1, succ2, info) :: k
  | Cge -> Icond (CEbgel optR0, [ a1; a2 ], succ1, succ2, info) :: k

let cbranch_int64u is_x0 cmp a1 a2 info succ1 succ2 k =
  let optR0 = make_optR0 is_x0 (is_inv_cmp cmp) in
  match cmp with
  | Ceq -> Icond (CEbequl optR0, [ a1; a2 ], succ1, succ2, info) :: k
  | Cne -> Icond (CEbneul optR0, [ a1; a2 ], succ1, succ2, info) :: k
  | Clt -> Icond (CEbltul optR0, [ a1; a2 ], succ1, succ2, info) :: k
  | Cle -> Icond (CEbgeul optR0, [ a2; a1 ], succ1, succ2, info) :: k
  | Cgt -> Icond (CEbltul optR0, [ a2; a1 ], succ1, succ2, info) :: k
  | Cge -> Icond (CEbgeul optR0, [ a1; a2 ], succ1, succ2, info) :: k

let cond_int32s is_x0 cmp a1 a2 dest tmp_reg succ map_consts =
  let optR0 = make_optR0 is_x0 (is_inv_cmp cmp) in
  match cmp with
  | Ceq -> [ Iop (OEseqw optR0, [ a1; a2 ], dest, succ) ]
  | Cne -> [ Iop (OEsnew optR0, [ a1; a2 ], dest, succ) ]
  | Clt -> [ Iop (OEsltw optR0, [ a1; a2 ], dest, succ) ]
  | Cle ->
      let r = r2pi () in
      let op = OEsltw optR0 in
      let sv = find_or_addnmove op [ a2; a1 ] r (get tmp_reg) map_consts true in
      let ht = build_head_tuple [] sv in
      let r' = unzip_head_tuple ht r in
      fst ht @ [ Iop (OExoriw Int.one, [ r' ], dest, succ) ]
  | Cgt -> [ Iop (OEsltw optR0, [ a2; a1 ], dest, succ) ]
  | Cge ->
      let r = r2pi () in
      let op = OEsltw optR0 in
      let sv = find_or_addnmove op [ a1; a2 ] r (get tmp_reg) map_consts true in
      let ht = build_head_tuple [] sv in
      let r' = unzip_head_tuple ht r in
      fst ht @ [ Iop (OExoriw Int.one, [ r' ], dest, succ) ]

let cond_int32u is_x0 cmp a1 a2 dest tmp_reg succ map_consts =
  let optR0 = make_optR0 is_x0 (is_inv_cmp cmp) in
  match cmp with
  | Ceq -> [ Iop (OEsequw optR0, [ a1; a2 ], dest, succ) ]
  | Cne -> [ Iop (OEsneuw optR0, [ a1; a2 ], dest, succ) ]
  | Clt -> [ Iop (OEsltuw optR0, [ a1; a2 ], dest, succ) ]
  | Cle ->
      let r = r2pi () in
      let op = OEsltuw optR0 in
      let sv = find_or_addnmove op [ a2; a1 ] r (get tmp_reg) map_consts true in
      let ht = build_head_tuple [] sv in
      let r' = unzip_head_tuple ht r in
      fst ht @ [ Iop (OExoriw Int.one, [ r' ], dest, succ) ]
  | Cgt -> [ Iop (OEsltuw optR0, [ a2; a1 ], dest, succ) ]
  | Cge ->
      let r = r2pi () in
      let op = OEsltuw optR0 in
      let sv = find_or_addnmove op [ a1; a2 ] r (get tmp_reg) map_consts true in
      let ht = build_head_tuple [] sv in
      let r' = unzip_head_tuple ht r in
      fst ht @ [ Iop (OExoriw Int.one, [ r' ], dest, succ) ]

let cond_int64s is_x0 cmp a1 a2 dest tmp_reg succ map_consts =
  let optR0 = make_optR0 is_x0 (is_inv_cmp cmp) in
  match cmp with
  | Ceq -> [ Iop (OEseql optR0, [ a1; a2 ], dest, succ) ]
  | Cne -> [ Iop (OEsnel optR0, [ a1; a2 ], dest, succ) ]
  | Clt -> [ Iop (OEsltl optR0, [ a1; a2 ], dest, succ) ]
  | Cle ->
      let r = r2pi () in
      let op = OEsltl optR0 in
      let sv = find_or_addnmove op [ a2; a1 ] r (get tmp_reg) map_consts true in
      let ht = build_head_tuple [] sv in
      let r' = unzip_head_tuple ht r in
      fst ht @ [ Iop (OExoriw Int.one, [ r' ], dest, succ) ]
  | Cgt -> [ Iop (OEsltl optR0, [ a2; a1 ], dest, succ) ]
  | Cge ->
      let r = r2pi () in
      let op = OEsltl optR0 in
      let sv = find_or_addnmove op [ a1; a2 ] r (get tmp_reg) map_consts true in
      let ht = build_head_tuple [] sv in
      let r' = unzip_head_tuple ht r in
      fst ht @ [ Iop (OExoriw Int.one, [ r' ], dest, succ) ]

let cond_int64u is_x0 cmp a1 a2 dest tmp_reg succ map_consts =
  let optR0 = make_optR0 is_x0 (is_inv_cmp cmp) in
  match cmp with
  | Ceq -> [ Iop (OEsequl optR0, [ a1; a2 ], dest, succ) ]
  | Cne -> [ Iop (OEsneul optR0, [ a1; a2 ], dest, succ) ]
  | Clt -> [ Iop (OEsltul optR0, [ a1; a2 ], dest, succ) ]
  | Cle ->
      let r = r2pi () in
      let op = OEsltul optR0 in
      let sv = find_or_addnmove op [ a2; a1 ] r (get tmp_reg) map_consts true in
      let ht = build_head_tuple [] sv in
      let r' = unzip_head_tuple ht r in
      fst ht @ [ Iop (OExoriw Int.one, [ r' ], dest, succ) ]
  | Cgt -> [ Iop (OEsltul optR0, [ a2; a1 ], dest, succ) ]
  | Cge ->
      let r = r2pi () in
      let op = OEsltul optR0 in
      let sv = find_or_addnmove op [ a1; a2 ] r (get tmp_reg) map_consts true in
      let ht = build_head_tuple [] sv in
      let r' = unzip_head_tuple ht r in
      fst ht @ [ Iop (OExoriw Int.one, [ r' ], dest, succ) ]

let is_normal_cmp = function Cne -> false | _ -> true

let cond_float cmp f1 f2 dest succ map_consts =
  match cmp with
  | Ceq -> [ Iop (OEfeqd, [ f1; f2 ], dest, succ) ]
  | Cne -> [ Iop (OEfeqd, [ f1; f2 ], dest, succ) ]
  | Clt -> [ Iop (OEfltd, [ f1; f2 ], dest, succ) ]
  | Cle -> [ Iop (OEfled, [ f1; f2 ], dest, succ) ]
  | Cgt -> [ Iop (OEfltd, [ f2; f1 ], dest, succ) ]
  | Cge -> [ Iop (OEfled, [ f2; f1 ], dest, succ) ]

let cond_single cmp f1 f2 dest succ map_consts =
  match cmp with
  | Ceq -> [ Iop (OEfeqs, [ f1; f2 ], dest, succ) ]
  | Cne -> [ Iop (OEfeqs, [ f1; f2 ], dest, succ) ]
  | Clt -> [ Iop (OEflts, [ f1; f2 ], dest, succ) ]
  | Cle -> [ Iop (OEfles, [ f1; f2 ], dest, succ) ]
  | Cgt -> [ Iop (OEflts, [ f2; f1 ], dest, succ) ]
  | Cge -> [ Iop (OEfles, [ f2; f1 ], dest, succ) ]

let expanse_cbranchimm_int32s cmp a1 n info succ1 succ2 k map_consts =
  if Int.eq n Int.zero then cbranch_int32s true cmp a1 a1 info succ1 succ2 k
  else
    let r = r2pi () in
    let ht = loadimm32 r n (n2pi ()) map_consts true in
    let r' = unzip_head_tuple ht r in
    fst ht @ cbranch_int32s false cmp a1 r' info succ1 succ2 k

let expanse_cbranchimm_int32u cmp a1 n info succ1 succ2 k map_consts =
  if Int.eq n Int.zero then cbranch_int32u true cmp a1 a1 info succ1 succ2 k
  else
    let r = r2pi () in
    let ht = loadimm32 r n (n2pi ()) map_consts true in
    let r' = unzip_head_tuple ht r in
    fst ht @ cbranch_int32u false cmp a1 r' info succ1 succ2 k

let expanse_cbranchimm_int64s cmp a1 n info succ1 succ2 k map_consts =
  if Int64.eq n Int64.zero then cbranch_int64s true cmp a1 a1 info succ1 succ2 k
  else
    let r = r2pi () in
    let ht = loadimm64 r n (n2pi ()) map_consts true in
    let r' = unzip_head_tuple ht r in
    fst ht @ cbranch_int64s false cmp a1 r' info succ1 succ2 k

let expanse_cbranchimm_int64u cmp a1 n info succ1 succ2 k map_consts =
  if Int64.eq n Int64.zero then cbranch_int64u true cmp a1 a1 info succ1 succ2 k
  else
    let r = r2pi () in
    let ht = loadimm64 r n (n2pi ()) map_consts true in
    let r' = unzip_head_tuple ht r in
    fst ht @ cbranch_int64u false cmp a1 r' info succ1 succ2 k

let get_tmp_reg = function Cle | Cge -> Some (n2pi ()) | _ -> None

let expanse_condimm_int32s cmp a1 n dest succ map_consts =
  if Int.eq n Int.zero then
    let tmp_reg = get_tmp_reg cmp in
    cond_int32s true cmp a1 a1 dest tmp_reg succ map_consts
  else
    match cmp with
    | Ceq | Cne ->
        let r = r2pi () in
        xorimm32 a1 r n (n2pi ())
          (cond_int32s true cmp r r dest None succ map_consts)
          map_consts
    | Clt -> sltimm32 a1 dest n succ [] map_consts
    | Cle ->
        if Int.eq n (Int.repr Int.max_signed) then
          let ht = loadimm32 dest Int.one succ map_consts false in
          fst ht
        else sltimm32 a1 dest (Int.add n Int.one) succ [] map_consts
    | _ ->
        let r = r2pi () in
        let tmp_reg = get_tmp_reg cmp in
        let ht = loadimm32 r n (n2pi ()) map_consts true in
        let r' = unzip_head_tuple ht r in
        fst ht @ cond_int32s false cmp a1 r' dest tmp_reg succ map_consts

let expanse_condimm_int32u cmp a1 n dest succ map_consts =
  let tmp_reg = get_tmp_reg cmp in
  if Int.eq n Int.zero then
    cond_int32u true cmp a1 a1 dest tmp_reg succ map_consts
  else
    match cmp with
    | Clt -> sltuimm32 a1 dest n succ [] map_consts
    | _ ->
        let r = r2pi () in
        let ht = loadimm32 r n (n2pi ()) map_consts true in
        let r' = unzip_head_tuple ht r in
        fst ht @ cond_int32u false cmp a1 r' dest tmp_reg succ map_consts

let expanse_condimm_int64s cmp a1 n dest succ map_consts =
  if Int64.eq n Int64.zero then
    let tmp_reg = get_tmp_reg cmp in
    cond_int64s true cmp a1 a1 dest tmp_reg succ map_consts
  else
    match cmp with
    | Ceq | Cne ->
        let r = r2pi () in
        xorimm64 a1 r n (n2pi ())
          (cond_int64s true cmp r r dest None succ map_consts)
          map_consts
    | Clt -> sltimm64 a1 dest n succ [] map_consts
    | Cle ->
        if Int64.eq n (Int64.repr Int64.max_signed) then
          let ht = loadimm32 dest Int.one succ map_consts false in
          fst ht
        else sltimm64 a1 dest (Int64.add n Int64.one) succ [] map_consts
    | _ ->
        let r = r2pi () in
        let tmp_reg = get_tmp_reg cmp in
        let ht = loadimm64 r n (n2pi ()) map_consts true in
        let r' = unzip_head_tuple ht r in
        fst ht @ cond_int64s false cmp a1 r' dest tmp_reg succ map_consts

let expanse_condimm_int64u cmp a1 n dest succ map_consts =
  let tmp_reg = get_tmp_reg cmp in
  if Int64.eq n Int64.zero then
    cond_int64u true cmp a1 a1 dest tmp_reg succ map_consts
  else
    match cmp with
    | Clt -> sltuimm64 a1 dest n succ [] map_consts
    | _ ->
        let r = r2pi () in
        let ht = loadimm64 r n (n2pi ()) map_consts true in
        let r' = unzip_head_tuple ht r in
        fst ht @ cond_int64u false cmp a1 r' dest tmp_reg succ map_consts

let expanse_cond_fp cnot fn_cond cmp f1 f2 dest succ map_consts =
  let normal = is_normal_cmp cmp in
  let normal' = if cnot then not normal else normal in
  let succ' = if normal' then succ else n2pi () in
  let insn = fn_cond cmp f1 f2 dest succ' map_consts in
  if normal' then insn
  else build_full_ilist (OExoriw Int.one) [ dest ] dest succ insn [] map_consts

let expanse_cbranch_fp cnot fn_cond cmp f1 f2 info succ1 succ2 map_consts =
  let r = r2pi () in
  let normal = is_normal_cmp cmp in
  let normal' = if cnot then not normal else normal in
  let insn = List.hd (fn_cond cmp f1 f2 r (n2pi ()) map_consts) in
  insn
  ::
  (if normal' then [ Icond (CEbnew (Some false), [ r; r ], succ1, succ2, info) ]
  else [ Icond (CEbeqw (Some false), [ r; r ], succ1, succ2, info) ])

let get_regindent = function Coq_inr _ -> [] | Coq_inl r -> [ r ]

let get_regs_inst = function
  | Inop _ -> []
  | Iop (_, args, dest, _) -> dest :: args
  | Iload (_, _, _, args, dest, _) -> dest :: args
  | Istore (_, _, args, src, _) -> src :: args
  | Icall (_, t, args, dest, _) -> dest :: (get_regindent t @ args)
  | Itailcall (_, t, args) -> get_regindent t @ args
  | Ibuiltin (_, args, dest, _) ->
      AST.params_of_builtin_res dest @ AST.params_of_builtin_args args
  | Icond (_, args, _, _, _) -> args
  | Ijumptable (arg, _) -> [ arg ]
  | Ireturn (Some r) -> [ r ]
  | _ -> []

let write_initial_node initial code' new_order =
  code' := PTree.set initial (Inop (n2p ())) !code';
  new_order := initial :: !new_order

let write_pathmap initial esize pm' =
  let path = get_some @@ PTree.get initial !pm' in
  let npsize = Camlcoq.Nat.of_int (esize + Camlcoq.Nat.to_int path.psize) in
  let path' =
    {
      psize = npsize;
      input_regs = path.input_regs;
      pre_output_regs = path.pre_output_regs;
      output_regs = path.output_regs;
    }
  in
  pm' := PTree.set initial path' !pm'

let rec write_tree exp initial current code' new_order fturn =
  (*Printf.eprintf "wt: node is %d\n" !node;*)
  let target_node, next_node =
    if fturn then (P.to_int initial, current) else (current, current - 1)
  in
  match exp with
  | inst :: k ->
      (*let open PrintRTL in*)
      (*print_instruction stderr (target_node, inst);*)
      code' := PTree.set (P.of_int target_node) inst !code';
      new_order := P.of_int target_node :: !new_order;
      write_tree k initial next_node code' new_order false
  | [] -> ()

let expanse (sb : superblock) code pm =
  (*debug_flag := true;*)
  let new_order = ref [] in
  let liveins = ref sb.liveins in
  let exp = ref [] in
  let was_branch = ref false in
  let was_exp = ref false in
  let code' = ref code in
  let pm' = ref pm in
  let map_consts = Hashtbl.create 100 in
  Array.iter
    (fun n ->
      was_branch := false;
      was_exp := false;
      let inst = get_some @@ PTree.get n code in
      (if !Clflags.option_fexpanse_rtlcond then
       match inst with
       (* Expansion of conditions - Ocmp *)
       | Iop (Ocmp (Ccomp c), a1 :: a2 :: nil, dest, succ) ->
           debug "Iop/Ccomp\n";
           let tmp_reg = get_tmp_reg c in
           exp := cond_int32s false c a1 a2 dest tmp_reg succ map_consts;
           was_exp := true
       | Iop (Ocmp (Ccompu c), a1 :: a2 :: nil, dest, succ) ->
           debug "Iop/Ccompu\n";
           let tmp_reg = get_tmp_reg c in
           exp := cond_int32u false c a1 a2 dest tmp_reg succ map_consts;
           was_exp := true
       | Iop (Ocmp (Ccompimm (c, imm)), a1 :: nil, dest, succ) ->
           debug "Iop/Ccompimm\n";
           exp := expanse_condimm_int32s c a1 imm dest succ map_consts;
           was_exp := true
       | Iop (Ocmp (Ccompuimm (c, imm)), a1 :: nil, dest, succ) ->
           debug "Iop/Ccompuimm\n";
           exp := expanse_condimm_int32u c a1 imm dest succ map_consts;
           was_exp := true
       | Iop (Ocmp (Ccompl c), a1 :: a2 :: nil, dest, succ) ->
           debug "Iop/Ccompl\n";
           let tmp_reg = get_tmp_reg c in
           exp := cond_int64s false c a1 a2 dest tmp_reg succ map_consts;
           was_exp := true
       | Iop (Ocmp (Ccomplu c), a1 :: a2 :: nil, dest, succ) ->
           debug "Iop/Ccomplu\n";
           let tmp_reg = get_tmp_reg c in
           exp := cond_int64u false c a1 a2 dest tmp_reg succ map_consts;
           was_exp := true
       | Iop (Ocmp (Ccomplimm (c, imm)), a1 :: nil, dest, succ) ->
           debug "Iop/Ccomplimm\n";
           exp := expanse_condimm_int64s c a1 imm dest succ map_consts;
           was_exp := true
       | Iop (Ocmp (Ccompluimm (c, imm)), a1 :: nil, dest, succ) ->
           debug "Iop/Ccompluimm\n";
           exp := expanse_condimm_int64u c a1 imm dest succ map_consts;
           was_exp := true
       | Iop (Ocmp (Ccompf c), f1 :: f2 :: nil, dest, succ) ->
           debug "Iop/Ccompf\n";
           exp := expanse_cond_fp false cond_float c f1 f2 dest succ map_consts;
           was_exp := true
       | Iop (Ocmp (Cnotcompf c), f1 :: f2 :: nil, dest, succ) ->
           debug "Iop/Cnotcompf\n";
           exp := expanse_cond_fp true cond_float c f1 f2 dest succ map_consts;
           was_exp := true
       | Iop (Ocmp (Ccompfs c), f1 :: f2 :: nil, dest, succ) ->
           debug "Iop/Ccompfs\n";
           exp := expanse_cond_fp false cond_single c f1 f2 dest succ map_consts;
           was_exp := true
       | Iop (Ocmp (Cnotcompfs c), f1 :: f2 :: nil, dest, succ) ->
           debug "Iop/Cnotcompfs\n";
           exp := expanse_cond_fp true cond_single c f1 f2 dest succ map_consts;
           was_exp := true
       (* Expansion of branches - Ccomp *)
       | Icond (Ccomp c, a1 :: a2 :: nil, succ1, succ2, info) ->
           debug "Icond/Ccomp\n";
           exp := cbranch_int32s false c a1 a2 info succ1 succ2 [];
           was_branch := true;
           was_exp := true
       | Icond (Ccompu c, a1 :: a2 :: nil, succ1, succ2, info) ->
           debug "Icond/Ccompu\n";
           exp := cbranch_int32u false c a1 a2 info succ1 succ2 [];
           was_branch := true;
           was_exp := true
       | Icond (Ccompimm (c, imm), a1 :: nil, succ1, succ2, info) ->
           debug "Icond/Ccompimm\n";
           exp :=
             expanse_cbranchimm_int32s c a1 imm info succ1 succ2 [] map_consts;
           was_branch := true;
           was_exp := true
       | Icond (Ccompuimm (c, imm), a1 :: nil, succ1, succ2, info) ->
           debug "Icond/Ccompuimm\n";
           exp :=
             expanse_cbranchimm_int32u c a1 imm info succ1 succ2 [] map_consts;
           was_branch := true;
           was_exp := true
       | Icond (Ccompl c, a1 :: a2 :: nil, succ1, succ2, info) ->
           debug "Icond/Ccompl\n";
           exp := cbranch_int64s false c a1 a2 info succ1 succ2 [];
           was_branch := true;
           was_exp := true
       | Icond (Ccomplu c, a1 :: a2 :: nil, succ1, succ2, info) ->
           debug "Icond/Ccomplu\n";
           exp := cbranch_int64u false c a1 a2 info succ1 succ2 [];
           was_branch := true;
           was_exp := true
       | Icond (Ccomplimm (c, imm), a1 :: nil, succ1, succ2, info) ->
           debug "Icond/Ccomplimm\n";
           exp :=
             expanse_cbranchimm_int64s c a1 imm info succ1 succ2 [] map_consts;
           was_branch := true;
           was_exp := true
       | Icond (Ccompluimm (c, imm), a1 :: nil, succ1, succ2, info) ->
           debug "Icond/Ccompluimm\n";
           exp :=
             expanse_cbranchimm_int64u c a1 imm info succ1 succ2 [] map_consts;
           was_branch := true;
           was_exp := true
       | Icond (Ccompf c, f1 :: f2 :: nil, succ1, succ2, info) ->
           debug "Icond/Ccompf\n";
           exp :=
             expanse_cbranch_fp false cond_float c f1 f2 info succ1 succ2
               map_consts;
           was_branch := true;
           was_exp := true
       | Icond (Cnotcompf c, f1 :: f2 :: nil, succ1, succ2, info) ->
           debug "Icond/Cnotcompf\n";
           exp :=
             expanse_cbranch_fp true cond_float c f1 f2 info succ1 succ2
               map_consts;
           was_branch := true;
           was_exp := true
       | Icond (Ccompfs c, f1 :: f2 :: nil, succ1, succ2, info) ->
           debug "Icond/Ccompfs\n";
           exp :=
             expanse_cbranch_fp false cond_single c f1 f2 info succ1 succ2
               map_consts;
           was_branch := true;
           was_exp := true
       | Icond (Cnotcompfs c, f1 :: f2 :: nil, succ1, succ2, info) ->
           debug "Icond/Cnotcompfs\n";
           exp :=
             expanse_cbranch_fp true cond_single c f1 f2 info succ1 succ2
               map_consts;
           was_branch := true;
           was_exp := true
       | _ -> ());
      (if !Clflags.option_fexpanse_others && not !was_exp then
       match inst with
       (* Expansion of fp constants *)
       | Iop (Ofloatconst f, nil, dest, succ) ->
           debug "Iop/Ofloatconst\n";
           let r = r2pi () in
           let ht =
             loadimm64 r (Floats.Float.to_bits f) (n2pi ()) map_consts true
           in
           let r' = unzip_head_tuple ht r in
           exp :=
             build_full_ilist Ofloat_of_bits [ r' ] dest succ (fst ht) []
               map_consts;
           was_exp := true
       | Iop (Osingleconst f, nil, dest, succ) ->
           debug "Iop/Osingleconst\n";
           let r = r2pi () in
           let ht =
             loadimm32 r (Floats.Float32.to_bits f) (n2pi ()) map_consts true
           in
           let r' = unzip_head_tuple ht r in
           exp :=
             build_full_ilist Osingle_of_bits [ r' ] dest succ (fst ht) []
               map_consts;
           was_exp := true
       | Iop (Ointconst n, nil, dest, succ) ->
           debug "Iop/Ointconst\n";
           let ht = loadimm32 dest n succ map_consts false in
           exp := unzip_head_tuple_move ht dest succ;
           was_exp := true
       | Iop (Olongconst n, nil, dest, succ) ->
           debug "Iop/Olongconst\n";
           let ht = loadimm64 dest n succ map_consts false in
           exp := unzip_head_tuple_move ht dest succ;
           was_exp := true
       | Iop (Oaddimm n, a1 :: nil, dest, succ) ->
           debug "Iop/Oaddimm\n";
           exp := addimm32 a1 dest n succ [] map_consts;
           was_exp := true
       | Iop (Oaddlimm n, a1 :: nil, dest, succ) ->
           debug "Iop/Oaddlimm\n";
           exp := addimm64 a1 dest n succ [] map_consts;
           was_exp := true
       | Iop (Oandimm n, a1 :: nil, dest, succ) ->
           debug "Iop/Oandimm\n";
           exp := andimm32 a1 dest n succ [] map_consts;
           was_exp := true
       | Iop (Oandlimm n, a1 :: nil, dest, succ) ->
           debug "Iop/Oandlimm\n";
           exp := andimm64 a1 dest n succ [] map_consts;
           was_exp := true
       | Iop (Oorimm n, a1 :: nil, dest, succ) ->
           debug "Iop/Oorimm\n";
           exp := orimm32 a1 dest n succ [] map_consts;
           was_exp := true
       | Iop (Oorlimm n, a1 :: nil, dest, succ) ->
           debug "Iop/Oorlimm\n";
           exp := orimm64 a1 dest n succ [] map_consts;
           was_exp := true
       | Iop (Ocast8signed, a1 :: nil, dest, succ) ->
           debug "Iop/cast8signed";
           let op = Oshlimm (Int.repr (Z.of_sint 24)) in
           let r = r2pi () in
           let sv = find_or_addnmove op [ a1 ] r (n2pi ()) map_consts true in
           let ht = build_head_tuple [] sv in
           let r' = unzip_head_tuple ht r in
           exp :=
             build_full_ilist
               (Oshrimm (Int.repr (Z.of_sint 24)))
               [ r' ] dest succ (fst ht) [] map_consts;
           was_exp := true
       | Iop (Ocast16signed, a1 :: nil, dest, succ) ->
           debug "Iop/cast8signed";
           let op = Oshlimm (Int.repr (Z.of_sint 16)) in
           let r = r2pi () in
           let sv = find_or_addnmove op [ a1 ] r (n2pi ()) map_consts true in
           let ht = build_head_tuple [] sv in
           let r' = unzip_head_tuple ht r in
           exp :=
             build_full_ilist
               (Oshrimm (Int.repr (Z.of_sint 16)))
               [ r' ] dest succ (fst ht) [] map_consts;
           was_exp := true
       | Iop (Ocast32unsigned, a1 :: nil, dest, succ) ->
           debug "Iop/Ocast32unsigned";
           let n2 = n2pi () in
           let n1 = n2pi () in
           let r1 = r2pi () in
           let r2 = r2pi () in
           let op1 = Ocast32signed in
           let sv1 = find_or_addnmove op1 [ a1 ] r1 n1 map_consts true in
           let ht1 = build_head_tuple [] sv1 in
           let r1' = unzip_head_tuple ht1 r1 in

           let op2 = Oshllimm (Int.repr (Z.of_sint 32)) in
           let sv2 = find_or_addnmove op2 [ r1' ] r2 n2 map_consts true in
           let ht2 = build_head_tuple (fst ht1) sv2 in
           let r2' = unzip_head_tuple ht2 r2 in

           let op3 = Oshrluimm (Int.repr (Z.of_sint 32)) in
           exp := build_full_ilist op3 [ r2' ] dest succ (fst ht2) [] map_consts
       | Iop (Oshrximm n, a1 :: nil, dest, succ) ->
           debug "Iop/Oshrximm";
           if Int.eq n Int.zero then exp := [ Iop (Omove, [ a1 ], dest, succ) ]
           else if Int.eq n Int.one then
             let n2 = n2pi () in
             let n1 = n2pi () in
             let r1 = r2pi () in
             let r2 = r2pi () in
             let op1 = Oshruimm (Int.repr (Z.of_sint 31)) in
             let sv1 = find_or_addnmove op1 [ a1 ] r1 n1 map_consts true in
             let ht1 = build_head_tuple [] sv1 in
             let r1' = unzip_head_tuple ht1 r1 in

             let op2 = Oadd in
             let sv2 = find_or_addnmove op2 [ a1; r1' ] r2 n2 map_consts true in
             let ht2 = build_head_tuple (fst ht1) sv2 in
             let r2' = unzip_head_tuple ht2 r2 in

             let op3 = Oshrimm Int.one in
             exp :=
               build_full_ilist op3 [ r2' ] dest succ (fst ht2) [] map_consts
           else
             let n3 = n2pi () in
             let n2 = n2pi () in
             let n1 = n2pi () in
             let r1 = r2pi () in
             let r2 = r2pi () in
             let r3 = r2pi () in
             let op1 = Oshrimm (Int.repr (Z.of_sint 31)) in
             let sv1 = find_or_addnmove op1 [ a1 ] r1 n1 map_consts true in
             let ht1 = build_head_tuple [] sv1 in
             let r1' = unzip_head_tuple ht1 r1 in

             let op2 = Oshruimm (Int.sub Int.iwordsize n) in
             let sv2 = find_or_addnmove op2 [ r1' ] r2 n2 map_consts true in
             let ht2 = build_head_tuple (fst ht1) sv2 in
             let r2' = unzip_head_tuple ht2 r2 in

             let op3 = Oadd in
             let sv3 = find_or_addnmove op3 [ a1; r2' ] r3 n3 map_consts true in
             let ht3 = build_head_tuple (fst ht2) sv3 in
             let r3' = unzip_head_tuple ht3 r3 in

             let op4 = Oshrimm n in
             exp :=
               build_full_ilist op4 [ r3' ] dest succ (fst ht3) [] map_consts
       | Iop (Oshrxlimm n, a1 :: nil, dest, succ) ->
           debug "Iop/Oshrxlimm";
           if Int.eq n Int.zero then exp := [ Iop (Omove, [ a1 ], dest, succ) ]
           else if Int.eq n Int.one then
             let n2 = n2pi () in
             let n1 = n2pi () in
             let r1 = r2pi () in
             let r2 = r2pi () in
             let op1 = Oshrluimm (Int.repr (Z.of_sint 63)) in
             let sv1 = find_or_addnmove op1 [ a1 ] r1 n1 map_consts true in
             let ht1 = build_head_tuple [] sv1 in
             let r1' = unzip_head_tuple ht1 r1 in

             let op2 = Oaddl in
             let sv2 = find_or_addnmove op2 [ a1; r1' ] r2 n2 map_consts true in
             let ht2 = build_head_tuple (fst ht1) sv2 in
             let r2' = unzip_head_tuple ht2 r2 in

             let op3 = Oshrlimm Int.one in
             exp :=
               build_full_ilist op3 [ r2' ] dest succ (fst ht2) [] map_consts
           else
             let n3 = n2pi () in
             let n2 = n2pi () in
             let n1 = n2pi () in
             let r1 = r2pi () in
             let r2 = r2pi () in
             let r3 = r2pi () in
             let op1 = Oshrlimm (Int.repr (Z.of_sint 63)) in
             let sv1 = find_or_addnmove op1 [ a1 ] r1 n1 map_consts true in
             let ht1 = build_head_tuple [] sv1 in
             let r1' = unzip_head_tuple ht1 r1 in

             let op2 = Oshrluimm (Int.sub Int64.iwordsize' n) in
             let sv2 = find_or_addnmove op2 [ r1' ] r2 n2 map_consts true in
             let ht2 = build_head_tuple (fst ht1) sv2 in
             let r2' = unzip_head_tuple ht2 r2 in

             let op3 = Oaddl in
             let sv3 = find_or_addnmove op3 [ a1; r2' ] r3 n3 map_consts true in
             let ht3 = build_head_tuple (fst ht2) sv3 in
             let r3' = unzip_head_tuple ht3 r3 in

             let op4 = Oshrlimm n in
             exp :=
               build_full_ilist op4 [ r3' ] dest succ (fst ht3) [] map_consts
       | _ -> ());
      if !was_exp then (
        (if !was_branch && List.length !exp > 1 then
         let lives = PTree.get n !liveins in
         match lives with
         | Some lives ->
             let new_branch_pc = n2p () in
             liveins := PTree.set new_branch_pc lives !liveins;
             liveins := PTree.remove n !liveins
         | _ -> ());
        write_pathmap sb.instructions.(0) (List.length !exp - 1) pm';
        write_tree !exp n !node code' new_order true)
      else new_order := n :: !new_order)
    sb.instructions;
  sb.instructions <- Array.of_list (List.rev !new_order);
  sb.liveins <- !liveins;
  (*debug_flag := false;*)
  (!code', !pm')

let rec find_last_node_reg = function
  | [] -> ()
  | (pc, i) :: k ->
      let rec traverse_list var = function
        | [] -> ()
        | e :: t ->
            let e' = p2i e in
            if e' > !var then var := e';
            traverse_list var t
      in
      traverse_list node [ pc ];
      traverse_list reg (get_regs_inst i);
      find_last_node_reg k