The simple type unification algorithm suffered from some serious performance and memory problems when used with certain code bases. This adds some crucial optimizations that improve performance drastically.
295 lines
11 KiB
Go
295 lines
11 KiB
Go
// Mgmt
// Copyright (C) 2013-2019+ James Shubin and the project contributors
// Written by James Shubin <james@shubin.ca> and the project contributors
//
// This program is free software: you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation, either version 3 of the License, or
// (at your option) any later version.
//
// This program is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU General Public License for more details.
//
// You should have received a copy of the GNU General Public License
// along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
package interfaces
|
|
|
|
import (
|
|
"fmt"
|
|
"sort"
|
|
|
|
"github.com/purpleidea/mgmt/engine"
|
|
"github.com/purpleidea/mgmt/lang/types"
|
|
"github.com/purpleidea/mgmt/pgraph"
|
|
"github.com/purpleidea/mgmt/util/errwrap"
|
|
)
|
|
|
|
// Node represents either a Stmt or an Expr. It contains the minimum set of
// methods that they must both implement. In practice it is not used especially
// often since we usually know which kind of node we want.
type Node interface {
	// Apply takes a function that receives a Node and may return an error,
	// and itself returns an error.
	// NOTE(review): presumably implementations run fn on themselves and on
	// their child nodes; confirm against the implementers.
	Apply(fn func(Node) error) error

	//Parent() Node // TODO: should we implement this?
}
|
|
|
|
// Stmt represents a statement node in the language. A stmt could be a resource,
|
|
// a `bind` statement, or even an `if` statement. (Different from an `if`
|
|
// expression.)
|
|
type Stmt interface {
|
|
Node
|
|
fmt.Stringer // String() string
|
|
Init(*Data) error // initialize the populated node and validate
|
|
Interpolate() (Stmt, error) // return expanded form of AST as a new AST
|
|
SetScope(*Scope) error // set the scope here and propagate it downwards
|
|
Unify() ([]Invariant, error) // TODO: is this named correctly?
|
|
Graph() (*pgraph.Graph, error)
|
|
Output() (*Output, error)
|
|
}
|
|
|
|
// Expr represents an expression in the language. Expr implementations must have
|
|
// their method receivers implemented as pointer receivers so that they can be
|
|
// easily copied and moved around. Expr also implements pgraph.Vertex so that
|
|
// these can be stored as pointers in our graph data structure.
|
|
type Expr interface {
|
|
Node
|
|
//fmt.Stringer // already provided by pgraph.Vertex
|
|
pgraph.Vertex // must implement this since we store these in our graphs
|
|
Init(*Data) error // initialize the populated node and validate
|
|
Interpolate() (Expr, error) // return expanded form of AST as a new AST
|
|
SetScope(*Scope) error // set the scope here and propagate it downwards
|
|
SetType(*types.Type) error // sets the type definitively, errors if incompatible
|
|
Type() (*types.Type, error)
|
|
Unify() ([]Invariant, error) // TODO: is this named correctly?
|
|
Graph() (*pgraph.Graph, error)
|
|
Func() (Func, error) // a function that represents this reactively
|
|
SetValue(types.Value) error
|
|
Value() (types.Value, error)
|
|
}
|
|
|
|
// Data provides some data to the node that could be useful during its lifetime.
|
|
type Data struct {
|
|
// Fs represents a handle to the filesystem that we're running on. This
|
|
// is necessary for opening files if needed by import statements. The
|
|
// file() paths used to get templates or other files from our deploys
|
|
// come from here, this is *not* used to interact with the host file
|
|
// system to manage file resources or other aspects.
|
|
Fs engine.Fs
|
|
|
|
// Base directory (absolute path) that the running code is in. If an
|
|
// import is found, that's a recursive addition, and naturally for that
|
|
// run, this value would be different in the recursion.
|
|
Base string
|
|
|
|
// Files is a list of absolute paths seen so far. This includes all
|
|
// previously seen paths, where as the former Offsets parameter did not.
|
|
Files []string
|
|
|
|
// Imports stores a graph inside a vertex so we have a current cursor.
|
|
// This means that as we recurse through our import graph (hopefully a
|
|
// DAG) we can know what the parent vertex in our graph is to edge to.
|
|
// If we ever can't topologically sort it, then it has an import loop.
|
|
Imports *pgraph.SelfVertex
|
|
|
|
// Metadata is the metadata structure associated with the given parsing.
|
|
// It can be present, which is often the case when importing a module,
|
|
// or it can be nil, which is often the case when parsing a single file.
|
|
// When imports are nested (eg: an imported module imports another one)
|
|
// the metadata structure can recursively point to an earlier structure.
|
|
Metadata *Metadata
|
|
|
|
// Modules is an absolute path to a modules directory on the current Fs.
|
|
// It is the directory to use to look for remote modules if we haven't
|
|
// specified an alternative with the metadata Path field. This is
|
|
// usually initialized with the global modules path that can come from
|
|
// the cli or an environment variable, but this only occurs for the
|
|
// initial download/get operation, and obviously not once we're running
|
|
// a deploy, since by then everything in here would have been copied to
|
|
// the runtime fs.
|
|
Modules string
|
|
|
|
// Downloader is the interface that must be fulfilled to download
|
|
// modules. If a missing import is found, and this is not nil, then it
|
|
// will be run once in an attempt to get the missing module before it
|
|
// fails outright. In practice, it is recommended to separate this
|
|
// download phase in a separate step from the production running and
|
|
// deploys, however that is not blocked at the level of this interface.
|
|
Downloader Downloader
|
|
|
|
//World engine.World // TODO: do we need this?
|
|
|
|
// Prefix provides a unique path prefix that we can namespace in. It is
|
|
// currently shared identically across the whole AST. Nodes should be
|
|
// careful to not write on top of other nodes data.
|
|
Prefix string
|
|
|
|
// Debug represents if we're running in debug mode or not.
|
|
Debug bool
|
|
|
|
// Logf is a logger which should be used.
|
|
Logf func(format string, v ...interface{})
|
|
}
|
|
|
|
// Scope represents a mapping between a variables identifier and the
|
|
// corresponding expression it is bound to. Local scopes in this language exist
|
|
// and are formed by nesting within if statements. Child scopes can shadow
|
|
// variables in parent scopes, which is another way of saying they can redefine
|
|
// previously used variables as long as the new binding happens within a child
|
|
// scope. This is useful so that someone in the top scope can't prevent a child
|
|
// module from ever using that variable name again. It might be worth revisiting
|
|
// this point in the future if we find it adds even greater code safety. Please
|
|
// report any bugs you have written that would have been prevented by this. This
|
|
// also contains the currently available functions. They function similarly to
|
|
// the variables, and you can add new ones with a function statement definition.
|
|
// An interesting note about these is that they exist in a distinct namespace
|
|
// from the variables, which could actually contain lambda functions.
|
|
type Scope struct {
|
|
Variables map[string]Expr
|
|
Functions map[string]func() Func
|
|
Classes map[string]Stmt
|
|
|
|
Chain []Stmt // chain of previously seen stmt's
|
|
}
|
|
|
|
// EmptyScope returns the zero, empty value for the scope, with all the internal
|
|
// lists initialized appropriately.
|
|
func EmptyScope() *Scope {
|
|
return &Scope{
|
|
Variables: make(map[string]Expr),
|
|
Functions: make(map[string]func() Func),
|
|
Classes: make(map[string]Stmt),
|
|
Chain: []Stmt{},
|
|
}
|
|
}
|
|
|
|
// Copy makes a copy of the Scope struct. This ensures that if the internal map
|
|
// is changed, it doesn't affect other copies of the Scope. It does *not* copy
|
|
// or change the Expr pointers contained within, since these are references, and
|
|
// we need those to be consistently pointing to the same things after copying.
|
|
func (obj *Scope) Copy() *Scope {
|
|
variables := make(map[string]Expr)
|
|
functions := make(map[string]func() Func)
|
|
classes := make(map[string]Stmt)
|
|
chain := []Stmt{}
|
|
if obj != nil { // allow copying nil scopes
|
|
for k, v := range obj.Variables { // copy
|
|
variables[k] = v // we don't copy the expr's!
|
|
}
|
|
for k, v := range obj.Functions { // copy
|
|
functions[k] = v // we don't copy the generator func's
|
|
}
|
|
for k, v := range obj.Classes { // copy
|
|
classes[k] = v // we don't copy the StmtClass!
|
|
}
|
|
for _, x := range obj.Chain { // copy
|
|
chain = append(chain, x) // we don't copy the Stmt pointer!
|
|
}
|
|
}
|
|
return &Scope{
|
|
Variables: variables,
|
|
Functions: functions,
|
|
Classes: classes,
|
|
Chain: chain,
|
|
}
|
|
}
|
|
|
|
// Merge takes an existing scope and merges a scope on top of it. If any
|
|
// elements had to be overwritten, then the error result will contain some info.
|
|
// Even if this errors, the scope will have been merged successfully. The merge
|
|
// runs in a deterministic order so that errors will be consistent. Use Copy if
|
|
// you don't want to change this destructively.
|
|
// FIXME: this doesn't currently merge Chain's... Should it?
|
|
func (obj *Scope) Merge(scope *Scope) error {
|
|
var err error
|
|
// collect names so we can iterate in a deterministic order
|
|
namedVariables := []string{}
|
|
namedFunctions := []string{}
|
|
namedClasses := []string{}
|
|
for name := range scope.Variables {
|
|
namedVariables = append(namedVariables, name)
|
|
}
|
|
for name := range scope.Functions {
|
|
namedFunctions = append(namedFunctions, name)
|
|
}
|
|
for name := range scope.Classes {
|
|
namedClasses = append(namedClasses, name)
|
|
}
|
|
sort.Strings(namedVariables)
|
|
sort.Strings(namedFunctions)
|
|
sort.Strings(namedClasses)
|
|
|
|
for _, name := range namedVariables {
|
|
if _, exists := obj.Variables[name]; exists {
|
|
e := fmt.Errorf("variable `%s` was overwritten", name)
|
|
err = errwrap.Append(err, e)
|
|
}
|
|
obj.Variables[name] = scope.Variables[name]
|
|
}
|
|
for _, name := range namedFunctions {
|
|
if _, exists := obj.Functions[name]; exists {
|
|
e := fmt.Errorf("function `%s` was overwritten", name)
|
|
err = errwrap.Append(err, e)
|
|
}
|
|
obj.Functions[name] = scope.Functions[name]
|
|
}
|
|
for _, name := range namedClasses {
|
|
if _, exists := obj.Classes[name]; exists {
|
|
e := fmt.Errorf("class `%s` was overwritten", name)
|
|
err = errwrap.Append(err, e)
|
|
}
|
|
obj.Classes[name] = scope.Classes[name]
|
|
}
|
|
|
|
return err
|
|
}
|
|
|
|
// IsEmpty returns whether or not a scope is empty or not.
|
|
// FIXME: this doesn't currently consider Chain's... Should it?
|
|
func (obj *Scope) IsEmpty() bool {
|
|
//if obj == nil { // TODO: add me if this turns out to be useful
|
|
// return true
|
|
//}
|
|
if len(obj.Variables) > 0 {
|
|
return false
|
|
}
|
|
if len(obj.Functions) > 0 {
|
|
return false
|
|
}
|
|
if len(obj.Classes) > 0 {
|
|
return false
|
|
}
|
|
return true
|
|
}
|
|
|
|
// Edge is the data structure representing a compiled edge that is used in the
// lang to express a dependency between two resources and optionally send/recv.
// The fields suffixed with 1 and the Send field form one group, and the fields
// suffixed with 2 and the Recv field form the other.
type Edge struct {
	Kind1 string // kind of resource
	Name1 string // name of resource
	Send  string // name of field used for send/recv (optional)

	Kind2 string // kind of resource
	Name2 string // name of resource
	Recv  string // name of field used for send/recv (optional)

	Notify bool // is there a notification being sent?
}
|
|
|
|
// Output is a collection of data returned by a Stmt.
|
|
type Output struct { // returned by Stmt
|
|
Resources []engine.Res
|
|
Edges []*Edge
|
|
//Exported []*Exports // TODO: add exported resources
|
|
}
|
|
|
|
// EmptyOutput returns the zero, empty value for the output, with all the
|
|
// internal lists initialized appropriately.
|
|
func EmptyOutput() *Output {
|
|
return &Output{
|
|
Resources: []engine.Res{},
|
|
Edges: []*Edge{},
|
|
}
|
|
}
|