BinaryAnalysisPlatform
diff --git a/‎.github/workflows/build-and-test.yml
+8-2 b/‎.github/workflows/build-and-test.yml
+8-2
diff --git a/‎.github/workflows/build-dev-repo.yml
-1 b/‎.github/workflows/build-dev-repo.yml
-1
diff --git a/‎.github/workflows/build-from-opam.yml
+9-3 b/‎.github/workflows/build-from-opam.yml
+9-3
diff --git a/‎.github/workflows/nightly-testing.yml
+7-12 b/‎.github/workflows/nightly-testing.yml
+7-12
diff --git a/‎.github/workflows/publish-docker-image.yml
+1-1 b/‎.github/workflows/publish-docker-image.yml
+1-1
diff --git a/‎.github/workflows/release.yml
+6 b/‎.github/workflows/release.yml
+6
diff --git a/‎docker/ubuntu/bionic/Dockerfile
+5-2 b/‎docker/ubuntu/bionic/Dockerfile
+5-2
diff --git a/‎lib/arm/arm_target.ml
+27-3 b/‎lib/arm/arm_target.ml
+27-3
diff --git a/‎lib/arm/arm_target.mli
+1-1 b/‎lib/arm/arm_target.mli
+1-1
diff --git a/‎lib/bap/bap.mli
+46 b/‎lib/bap/bap.mli
+46
diff --git a/‎lib/bap/bap_project.ml
+11-11 b/‎lib/bap/bap_project.ml
+11-11
diff --git a/‎lib/bap_core_theory/bap_core_theory.mli
+40-5 b/‎lib/bap_core_theory/bap_core_theory.mli
+40-5
@@ -6,7 +6,7 @@ on:
 
 jobs:
   build:
-    runs-on: ubuntu-latest
+    runs-on: ubuntu-18.04
 
     env:
       OPAMJOBS: 2
@@ -32,7 +32,13 @@ jobs:
         run: opam pin add bap . --no-action
 
       - name: Install system dependencies
-        run: opam depext -u bap
+        run: opam depext -u bap-extra
+
+      - name: Install Ghidra
+        run: |
+          sudo add-apt-repository ppa:ivg/ghidra -y
+          sudo apt-get install libghidra-dev -y
+          sudo apt-get install libghidra-data -y
 
       - name: Install opam dependencies
         run: |
 
@@ -43,7 +43,6 @@ jobs:
         if: matrix.os == 'macos-latest'
         run: |
           rm -rf /usr/local/bin/2to3
-          brew unlink gcc@8
           brew unlink gcc@9
           brew update
           brew upgrade
 
@@ -10,7 +10,7 @@ jobs:
           - 4.11.x
           - 4.08.x
 
-    runs-on: ubuntu-latest
+    runs-on: ubuntu-18.04
 
     env:
       OPAMJOBS: 2
@@ -23,11 +23,17 @@ jobs:
           ocaml-compiler: ${{ matrix.ocaml-compiler }}
           dune-cache: true
 
+      - name: Install Ghidra
+        run: |
+          sudo add-apt-repository ppa:ivg/ghidra -y
+          sudo apt-get install libghidra-dev -y
+          sudo apt-get install libghidra-data -y
+
       - name: Add the testing Repository
         run: opam repo add bap git://github.com/BinaryAnalysisPlatform/opam-repository#testing
 
       - name: Install system dependencies
-        run: opam depext -u bap
+        run: opam depext -u bap-extra
 
       - name: Cleanup the Caches
         run: sudo apt clean --yes
@@ -36,7 +42,7 @@ jobs:
         run: df -h
 
       - name: Build and Install BAP Packages
-        run: opam clean -a; opam install bap
+        run: opam clean -a; opam install bap-extra
 
       - uses: actions/upload-artifact@v2
         if: ${{ always() }}
 
@@ -10,7 +10,7 @@ jobs:
     strategy:
       matrix:
         os:
-          - ubuntu-latest
+          - ubuntu-18.04
         ocaml-compiler:
           - 4.11.x
           - 4.08.x
@@ -29,30 +29,25 @@ jobs:
           dune-cache: true
           cache-prefix: nightly
 
-      - name: Configure Homebrew
-        if: matrix.os == 'macos-latest'
+      - name: Install Ghidra
         run: |
-          rm -rf /usr/local/bin/2to3
-          brew unlink gcc@8
-          brew unlink gcc@9
-          brew update
-          brew upgrade
-          echo 'LLVM_CONFIG=/usr/local/opt/llvm@9/bin/llvm-config' >> $GITHUB_ENV
+          sudo add-apt-repository ppa:ivg/ghidra -y
+          sudo apt-get install libghidra-dev -y
+          sudo apt-get install libghidra-data -y
 
       - name: Add the Testing Repository
         run: opam repo add bap git://github.com/BinaryAnalysisPlatform/opam-repository#testing
       - name: Install System Dependencies
-        run: opam depext -u bap
+        run: opam depext -u bap-extra
 
       - name: Install radare2 Dependencies
         run: opam depext -u bap-radare2
 
       - name: Cleanup the Caches
-        if: matrix.os == 'ubuntu-latest'
         run: sudo apt clean --yes
 
       - name: Build and Install BAP
-        run: opam install bap bap-radare2
+        run: opam install bap-extra bap-radare2
 
       - name: Checkout the Tests
         uses: actions/checkout@v2
 
@@ -21,4 +21,4 @@ jobs:
         with:
           push: true
           tags: binaryanalysisplatform/bap:latest
-          file: docker/ubuntu/xenial/Dockerfile
+          file: docker/ubuntu/bionic/Dockerfile
@@ -24,6 +24,12 @@ jobs:
           ocaml-compiler: ocaml-variants.4.11.2+flambda
           dune-cache: true
 
+      - name: Install Ghidra
+        run: |
+          sudo add-apt-repository ppa:ivg/ghidra -y
+          sudo apt-get install libghidra-dev -y
+          sudo apt-get install libghidra-data -y
+
       - name: Add the testing Repository
         run: opam repo add bap git://github.com/BinaryAnalysisPlatform/opam-repository#testing
       - name: Build deb packages
 
@@ -2,13 +2,16 @@ FROM ocaml/opam2:ubuntu-18.04
 
 WORKDIR /home/opam
 
-RUN sudo apt-get update  \
+RUN sudo add-apt-repository ppa:ivg/ghidra -y \
+ && sudo apt-get install libghidra-dev -y \
+ && sudo apt-get install libghidra-data -y \
+ && sudo apt-get update  \
  && opam switch 4.09 \
  && eval "$(opam env)" \
  && opam remote set-url default https://opam.ocaml.org \
  && opam repo add bap git://github.com/BinaryAnalysisPlatform/opam-repository --all \
  && opam update \
- && opam depext --install bap --yes -j 1 \
+ && opam depext --install bap-extra --yes -j 1 \
  && opam clean -acrs \
  && rm -rf /home/opam/.opam/4.0[2-8,10] \
  && rm -rf /home/opam/.opam/4.09/.opam-switch/sources/* \
 
@@ -384,6 +384,7 @@ let enable_arch () =
 let llvm_a32 = CT.Language.declare ~package "llvm-armv7"
 let llvm_t32 = CT.Language.declare ~package "llvm-thumb"
 let llvm_a64 = CT.Language.declare ~package "llvm-aarch64"
+let pcode = CT.Language.declare ~package "pcode-arm"
 
 module Dis = Disasm_expert.Basic
 
@@ -459,6 +460,27 @@ let before_thumb2 t = t < LE.v6t2 || t < EB.v6t2
 let is_64bit t = LE.v8a <= t || EB.v8a <= t || Bi.v8a <= t
 let is_thumb_only t = LE.v7m <= t || EB.v7m <= t || Bi.v7m <= t
 
+let is_big t = Theory.Target.endianness t = Theory.Endianness.eb
+let is_little t = Theory.Target.endianness t = Theory.Endianness.le
+
+let register_pcode () = (* registers the Ghidra-backed p-code decoder *)
+  Dis.register pcode @@ fun t ->
+  let triple = match is_64bit t,is_little t,is_big t with
+    | true,true,_ -> "AARCH64:LE:64:v8A" (* 64-bit targets need A64 *)
+    | true,_,true -> "AARCH64:BE:64:v8A"
+    | true,_,_    -> "AARCH64:LE:64:v8A" (* no bi-endian A64 spec *)
+    | false,true,_ -> "ARM:LE:32:v7"
+    | false,_,true -> "ARM:BE:32:v7"
+    | false,_,_    -> "ARM:LEBE:32:v7LEInstruction" in
+  Dis.create ~backend:"ghidra" triple
+
+let enable_pcode () =
+  register_pcode ();
+  KB.promise Theory.Label.encoding @@ fun label ->
+  Theory.Label.target label >>| fun t ->
+  if is_arm t then pcode
+  else Theory.Language.unknown
+
 let guess_encoding interworking label target =
   if is_arm target then
     if is_64bit target then !!llvm_a64 else
@@ -472,7 +494,7 @@ let guess_encoding interworking label target =
         | false -> !!llvm_a32
   else !!CT.Language.unknown
 
-let enable_decoder ?interworking () =
+let enable_llvm ?interworking () =
   let open KB.Syntax in
   register llvm_a32 "armv7";
   register llvm_t32 "thumbv7" ~attrs:"+thumb2";
@@ -481,7 +503,9 @@ let enable_decoder ?interworking () =
   CT.Label.target label >>= guess_encoding interworking label
 
 
-let load ?interworking () =
+let load ?interworking ?(backend="llvm") () =
   enable_loader ();
   enable_arch ();
-  enable_decoder ?interworking ()
+  if String.equal backend "llvm"
+  then enable_llvm ?interworking ()
+  else enable_pcode ()
@@ -115,4 +115,4 @@ val llvm_a64 : Theory.language
     a symbol there with an odd address (which is used to indicate
     thumb encoding) then interworking is enabled.
 *)
-val load : ?interworking:bool -> unit -> unit
+val load : ?interworking:bool -> ?backend:string -> unit -> unit
@@ -2412,6 +2412,18 @@ module Std : sig
     val intrinsic: string Attribute.t
 
 
+    (** [label] a named code location.
+
+        @since 2.4.0  *)
+    val label : string Attribute.t
+
+
+    (** [goto] represents a control-flow transfer to a named label.
+
+        @since 2.4.0 *)
+    val goto : string Attribute.t
+
+
     (** Core Theory specification of BIL.  *)
     module Theory : sig
 
@@ -6976,6 +6988,40 @@ module Std : sig
         by evaluating in many languages, e.g. Python, Js, etc *)
     val pp_adt : Format.formatter -> t -> unit
 
+
+    (** Subinstruction Sequence Number.
+
+        A subinstruction sequence number plays the role of an address
+        for subinstructions (which otherwise share the same physical
+        address).
+
+        Each subinstruction has a sequence number that is unique across
+        the whole program (not only among the subinstructions of the
+        same instruction) and, much like with [Theory.Label.for_addr],
+        it is possible to get a label that corresponds to an
+        instruction with the given sequence number using
+        [Seqnum.label].
+
+        The sequence number is represented with an integer to enable
+        address arithmetic. A subinstruction that follows a
+        subinstruction with the sequence number [N] has the sequence
+        number [N+1].
+
+        @since 2.4.0
+    *)
+    module Seqnum : sig
+      type t = int
+
+
+      (** [label seqnum] returns the program label that corresponds
+          to [seqnum].  *)
+      val label : ?package:string -> t -> Theory.Label.t KB.t
+
+      (** [slot] for accessing the sequence number of a subinstruction.  *)
+      val slot : (Theory.program, t option) KB.slot
+    end
+
+
     (** {3 Prefix Tree}
         This module provides a trie data structure where a sequence of
         instructions is used as a key (and an individual instruction
 
@@ -39,22 +39,22 @@ let memory_slot = KB.Class.property Theory.Unit.cls "unit-memory"
     ~desc:"annotated memory regions of the unit"
     Memmap.domain
 
-let with_filename spec target code memory path =
+let with_filename spec target _code memory path f =
   let open KB.Syntax in
   let width = Theory.Target.code_addr_size target in
   let bias = query spec Image.Scheme.bias |> Option.map
                ~f:(fun x -> Bitvec.(int64 x mod modulus width)) in
+  Theory.Unit.for_file path >>= fun unit ->
+  KB.sequence [
+    KB.provide Image.Spec.slot unit spec;
+    KB.provide Theory.Unit.bias unit bias;
+    KB.provide Theory.Unit.target unit target;
+    KB.provide Image.Spec.slot unit spec;
+    KB.provide Theory.Unit.path unit (Some path);
+    KB.provide memory_slot unit memory;
+  ] >>= fun () ->
   KB.promising Theory.Label.unit ~promise:(fun _ ->
-      Theory.Unit.for_file path >>= fun unit ->
-      KB.sequence [
-        KB.provide Image.Spec.slot unit spec;
-        KB.provide Theory.Unit.bias unit bias;
-        KB.provide Theory.Unit.target unit target;
-        KB.provide Image.Spec.slot unit spec;
-        KB.provide Theory.Unit.path unit (Some path);
-        KB.provide memory_slot unit memory;
-      ] >>| fun () ->
-      Some unit)
+      !!(Some unit)) f
 
 
 module State = struct
 
@@ -138,11 +138,12 @@
     be bound to expressions. Sometimes variables are typed, sometimes
     they are just identifiers with not associated type.
 
-    In the Core Theory all variables are sorted, i.e., the have an
-    associated value sort. Variables are also having scope and
-    extent. Finally, variables could be mutable or immutable.
+    In the Core Theory all variables are sorted, i.e., they have an
+    associated value sort. Variables also have a scope (lexical
+    visibility) and an extent (lifetime). Finally, variables could be
+    mutable or immutable.
 
-    A physical variable is a global mutable variable with infinite
+    A physical variable is a global mutable variable with the infinite
     scope and extent. They are used to refer predefined (micro)
     architectural locations of a modeled system, e.g., registers,
     memory banks, caches, register files, etc. Global variables has
@@ -778,6 +779,10 @@ module Theory : sig
           Since such structures are required to be monomorphic, the
           sort type index should be removed using the [forget] function,
           before a sort could be stored in it.
+
+          Note, that the type index is only removed from the meta
+          language (OCaml) type, but is preserved in the value term,
+          so it could be reconstructed (refined) later.
       *)
       module Top : sig
         type t = unit sort [@@deriving bin_io, compare, sexp]
@@ -1080,7 +1085,9 @@ module Theory : sig
   *)
   module Var : sig
     type 'a t
+
     type ident [@@deriving bin_io, compare, sexp]
+
     type ord
 
 
@@ -1161,7 +1168,21 @@ module Theory : sig
         @since 2.3.0  *)
     val pp : Format.formatter -> 'a t -> unit
 
-    (** Variable identifiers.  *)
+    (** Variable identifiers.
+
+        Identifiers are compared caseless; otherwise the order loosely
+        matches the lexicographical order of the textual
+        representation. Identifiers of virtual variables are ordered
+        before identifiers of physical variables and mutable virtual
+        variables are ordered before immutable. Identifiers of a
+        versioned variable are ordered in the ascending order of their
+        versions. And identifiers of virtual variables are ordered in
+        the ascending order of their numeric values, e.g., [#2]
+        is ordered before [#123].
+
+        @before 2.4.0 the ordering was unspecified but wasn't caseless.
+        @since 2.4.0 the ordering is caseless
+    *)
     module Ident : sig
       type t = ident [@@deriving bin_io, compare, sexp]
       include Stringable.S with type t := t
@@ -1174,6 +1195,10 @@ module Theory : sig
 
         This module enables construction of complex data structures on
         variables, e.g., [Set.empty (module Theory.Var.Top)].
+
+        The variables are ordered by their identifiers so that two
+        variables with the same name but different sorts are compared
+        equal.
     *)
     module Top : sig
       type nonrec t = unit t [@@deriving bin_io, compare, sexp]
@@ -1782,6 +1807,16 @@ module Theory : sig
     val is_subroutine : (program, bool option) KB.slot
 
 
+    (** [fresh] a fresh label (a shortcut for [KB.create cls]).
+
+        @since 2.4.0   *)
+    val fresh : t knowledge
+
+    (** [null] is a shortcut for [KB.null cls].
+
+        @since 2.4.0  *)
+    val null : t
+
     (** [for_addr x] generates a link to address [x].
 
         It is guaranteed that every call [for_addr ~package x] with