lh-l4v/camkes/adl-spec/Types_CAMKES.thy

(*
 * Copyright 2020, Data61, CSIRO (ABN 41 687 119 230)
 *
 * SPDX-License-Identifier: GPL-2.0-only
 *)

chapter \<open>\label{sec:types}Types\<close>

(*<*)
theory Types_CAMKES
imports
  Access.Access
begin
(*>*)

text \<open>
  This section describes the types of entities that appear in the CAmkES
  Interface Definition Language (IDL) and Architecture Description Language
  (ADL). The model assumes that all syntactic elements are available in a single
  environment; that is, all @{term import} inclusion statements have already
  been processed and all references are to be resolved within this context.
\<close>

subsection \<open>\label{subsec:symbols}Symbols\<close>
text \<open>
  CAmkES has two types of symbols that exist in separate namespaces. Symbols of
  the first type are used in IDL descriptions to identify method names and
  parameters. These symbols are used during code generation and therefore need
  to be distinct within a specific interface.
\<close>
type_synonym idl_symbol = string

text \<open>
  The second type of symbols are used in ADL descriptions to identify components,
  connectors and other architecture-level entities. These symbols are also used
  during code generation, but are lexically scoped. E.g. Instantiated interfaces
  within separate components can have an identical name.
\<close>
type_synonym adl_symbol = string

text \<open>
  Although both symbols map to the same underlying type, these have different
  constraints (e.g. IDL symbols become direct substrings of code-level symbols
  and hence need to respect symbol naming restrictions for the target
  language(s)).
\<close>

subsection \<open>\label{subsec:methods}Methods\<close>
text \<open>
  Methods are the elements that make up a CAmkES procedure (described below).
  Each method within a CAmkES procedure has a list of parameters defined by a
  type, direction and symbol name. Each method also has an optional return
  value type. The valid types for method parameters and return values include
  a set of high level types designed to abstract the types available in a
  general programming language. By using only these types in a procedure
  description, the interface can be implemented in any valid target language.

  In high-level languages, arrays may have attached size information, while in
  C this information is passed as an extra parameter to their containing
  method. Arrays are parameterised with the underlying type of
  their elements. Similar to primitive types, using a high-level type for the
  elementary type of an array allows it to be implemented or used in any
  component, while using a C-specific type prevents implementing or using it in
  a component not written in C. Arrays of arrays and multidimensional arrays are
  not supported.

  We also support talking about arbitrary C types. These include fixed-width
  integers, floats, structs, etc. For these types, our model just passes their
  names around and they are expected to behave as simple value types
  (without embedded pointers).
\<close>

datatype number =
    \<comment> \<open>High level types\<close>
    UnsignedInteger
  | Integer
  | Real
  | Boolean

datatype textual =
    \<comment> \<open>High level types\<close>
    Character
  | String
    \<comment> \<open>C-specific types\<close>
  | char

datatype primitive =
    Numerical number
  | Textual textual

datatype array =
    SizedArray primitive
  | TerminatedArray primitive

datatype param_type =
    Primitive primitive
  | Array array
  | CType string

text \<open>
  Rather than having a single return value per procedure method, each
  method parameter can be an input parameter, an output parameter, or both.
\<close>
datatype param_direction =
    InParameter (* also covers 'refin' *)
  | OutParameter
  | InOutParameter

text \<open>
  Each procedure comprises a collection of methods that each have an
  optional return type,
  identifier and a list of parameters. Each parameter has a type and an
  identifier.
\<close>
record parameter =
  p_type        :: param_type
  p_direction   :: param_direction
  p_name        :: idl_symbol

record "method" =
  m_return_type :: "param_type option"
  m_name        :: idl_symbol
  m_parameters  :: "parameter list"
text \<open>
  The translation from procedure methods in IDL to their representation in
  Isabelle is straightforward. The CAmkES method

\begin{verbatim}
  int foo(in string s);
\end{verbatim}

  is translated to the Isabelle representation
\<close>
(*<*)value(*>*)
  "\<lparr>m_return_type = Some (Primitive (Numerical Integer)),
    m_name = ''foo'',
    m_parameters = [
      \<lparr>p_type = Primitive (Textual String),
       p_direction = InParameter,
       p_name = ''s''\<rparr>
    ]\<rparr>"
text \<open>
  More examples are given in \autoref{sec:examples}.
\<close>

subsection \<open>\label{subsec:interfaces}Interfaces\<close>
text \<open>
  Connections between two components are made from one interface to another.
  CAmkES distinguishes between
  interfaces that consist of a list of function calls and interfaces
  that have other patterns of interaction.

  There are three basic types of supported interfaces. The first, @{text procedure},
  is used for modelling traditional caller-callee semantics of interaction. The
  second, @{text event}, is used for asynchronous notifications such as interrupts.
  Finally, @{text dataport}, is used to model shared memory communication.
\<close>
type_synonym procedure = "method list"
type_synonym event     = nat \<comment> \<open>ID\<close>
type_synonym dataport  = "string option" \<comment> \<open>type\<close>
datatype interface =
    Procedure procedure
  | Event event
  | Dataport dataport

subsection \<open>\label{subsec:connectors}Connectors\<close>
text \<open>
  Two components are connected via a connector. The type of a connector
  comprises two orthogonal features:

  \begin{itemize}
    \item The kind of components being connected: @{text connector_endpoint}
    \item The communication mechanism: @{text connector_mechanism}
  \end{itemize}
\<close>

text \<open>
  Connector types.

  Native connectors are used for ordinary communication between software
  components; these are found in almost all component platform models.

  Hardware devices are also modelled as components in CAmkES.
  Hardware connectors are used to connect the interface of a device to
  the interface of a software component (typically, a driver).

  Export connectors are used when
  specifying a compound component. A compound component has a set of interfaces
  that are a subset of the unconnected interfaces of its constituent components.
  The exposed interfaces of the compound component are defined by using export
  connectors to map these to the interfaces of the internal components.

  Export connectors are purely an architectural-level entity and do not exist at
  runtime. During code generation connections through exported interfaces are
  flattened. That is, a connection from interface A to exported interface B that
  exports interface C is instantiated as a connection from interface A to interface
  C would be. They can be thought of as a design-level convenience.

  \begin{figure}[h]
  \begin{center}
  \caption{\label{fig:export}An export connector}
  \includegraphics{imgs/composite-passthrough}
  \end{center}
  \end{figure}

  (Our model does not support compound components yet, but we may add support
   in the future. See \ref{subsubsec:composites} for more exposition.)
\<close>
datatype connector_type =
    NativeConnector
  | HardwareConnector
  | ExportConnector

text \<open>
  Connector interfaces.

  Each connector is declared to bind to a certain type of interface
  on its component endpoints. This also determines the interface
  exposed to user code.
\<close>
datatype connector_interface =
    RPCInterface
  | EventInterface
  | DataportInterface

text \<open>
  Connector access rights.

  This declares the types of access rights that may be made available
  by the connector. There are two sets of rights, corresponding to
  each nominal direction of the connector.

  Note that we will model connections to have separate access-control
  labels from components'. Hence we need \emph{six} sets: two for
  component rights to the connection objects (e.g. endpoints), and
  four for component rights to each other's objects.
\<close>
record connector_access =
    \<comment> \<open>@{text access_foo_bar} means access from the "@{text foo}" label to
        the "@{text bar}" label; labels may be from-components,
        to-components, or the connection itself\<close>
    access_from_to :: "auth set"
    access_to_from :: "auth set"

    \<comment> \<open>It might seem that components on the same side of a connection
        should not need access rights to each other.
        However, these auths are needed in more complicated systems,
        to work around bugs like VER-1108 and to express non-standard
        connector semantics such as VirtQueues.\<close>
    access_from_from :: "auth set"
    access_to_to :: "auth set"

    \<comment> \<open>we assume connections are passive labels, so they do not
        need access rights of their own\<close>
    access_from_conn :: "auth set"
    access_to_conn :: "auth set"

record connector =
    connector_type :: connector_type
    connector_interface :: connector_interface
    connector_access :: connector_access

subsection \<open>\label{subsec:components}Components\<close>
text \<open>
  Functional entities in a CAmkES system are represented as components. These
  are re-usable collections of source code with explicit descriptions of the
  exposed methods of interaction (@{term interfaces} described above).

  Components have three distinct interfaces for communication:
  \begin{enumerate}
    \item Synchronous communication over procedures. This communication is
      analogous to a function call and happens over a channel established from
      a @{text requires} interface to a @{text provides} interface.
    \item Asynchronous communication using events. This is suitable for things
      like interrupts and happens over a channel from an @{text emits} interface to
      a @{text consumes} interface.
    \item Bidirectional communication via shared memory. This is suitable for
      passing large data between components. It happens over a channel between
      two @{text dataports}.
  \end{enumerate}
\<close>
datatype InterfaceRequired = InterfaceRequired | InterfaceOptional

record component =
  control     :: bool
  hardware    :: bool
  requires    :: "(adl_symbol \<times> (InterfaceRequired \<times> procedure)) list"
  provides    :: "(adl_symbol \<times> procedure) list"
  dataports   :: "(adl_symbol \<times> dataport) list"
  emits       :: "(adl_symbol \<times> event) list"
  consumes    :: "(adl_symbol \<times> (InterfaceRequired \<times> event)) list"
  attributes  :: "(adl_symbol \<times> param_type) list"

subsection \<open>\label{subsec:assembling}Assembling a System\<close>
text \<open>
  A complete system is formed by instantiating component types that have been
  defined, interconnecting these instances and specifying a system
  configuration. Connections are specified by the two interfaces they connect
  and the communication mechanism in use.
\<close>
record connection =
  conn_type   :: connector
  conn_from   :: "(adl_symbol \<times> adl_symbol) list"
  conn_to     :: "(adl_symbol \<times> adl_symbol) list"

text \<open>
  A composition block is used to contain all components of the system and the
  connections that define their communication with each other.

  Additionally, it records which components are defined in a CAmkES
  @{text group} block. These components share a single address space
  and must also share the same access-control label.
  For more information, see the CAmkES documentation for groups.
\<close>
record composition =
  components  :: "(adl_symbol \<times> component) list"
  connections :: "(adl_symbol \<times> connection) list"
  group_labels :: "(adl_symbol \<times> adl_symbol) list" \<comment> \<open>See @{text get_group_label}, below\<close>

text \<open>
  Get the access-control label for a component or connection, taking
  groups into account. ADL names that are not part of groups are
  assumed to have their own labels.
\<close>
definition
  get_group_label :: "composition \<Rightarrow> adl_symbol \<Rightarrow> adl_symbol"
where
  "get_group_label spec c \<equiv>
     case map_of (group_labels spec) c of
         Some c' \<Rightarrow> c'
       | None \<Rightarrow> c"

text \<open>
  Configurations are used as a way of adding extra information to a component
  or specialising the component in a particular context. The attributes
  available to set are specified in the definition of the component, as
  indicated above. These attributes are accessible to the component at the
  code level at runtime.
\<close>
type_synonym configuration =
  "(adl_symbol \<times> adl_symbol \<times> string) list"

text \<open>
  Finally the system specification is expressed at the top level as an
  assembly. This extra level of abstraction allows more flexible re-use of
  compositions and configurations.
\<close>
record assembly =
  composition   :: "composition"
  configuration :: "configuration option"
  \<comment> \<open>This lets us shove extra policy edges into the generated integrity policy\<close>
  policy_extra  :: "(adl_symbol \<times> auth \<times> adl_symbol) set"

subsection \<open>\label{subsec:future}Future Work\<close>
subsubsection \<open>\label{subsubsec:composites}Component Hierarchy\<close>
text \<open>
  Some component platforms support the notion of explicit composite components.
  This allows a composition of components to be re-used as a component itself.
  In the context of the model presented above, this would allow a
  @{term composition} element to appear anywhere a @{term component} element
  is expected. Flexibility like this is desirable to avoid repeatedly
  constructing common design patterns involving fine grained components. There
  are plans to extend CAmkES to add this functionality.
\<close>

subsubsection \<open>\label{subsubsec:iarrays}Interface Arrays\<close>
text \<open>
  When specifying a more complicated dynamic component, it can be desirable to
  define an array of interfaces. For example, a component that
  provides an arbitrary number of copies of a specified procedure. This would
  be implemented by the size of the array (the number of such copies) being
  made available to the component at runtime and an index being provided with
  each procedure method invocation. An example of how this could be useful is
  discussed in \autoref{subsec:terminal}.

  Extending this further, allowing the specification of interface arrays that
  can be resized at runtime, by adding or removing connections, enables even
  greater flexibility. Supporting this kind of dynamism in a system requires
  meta functions (for modifying the interface array) and introduces further
  complexity in handling failures of these.
\<close>

(*<*)end(*>*)