Commit aca27394 authored by Eric Myhre's avatar Eric Myhre

First pass on generation for kinded unions.

So far, the generation itself runs, but the result will not yet compile.
I just want a checkpoint here.  (Most of this was written a few days ago already.)
parent d70a19d6
package gengo
import (
var _ TypeGenerator = &unionReprKindedGenerator{}
// Kinded union representations are quite wild: their behavior varies almost completely per inhabitant,
// and their implementation is generally delegating directly to something else,
// rather than having an intermediate node (like most unions do, and like the type-level view of this same value will).
// This also means any error values can be a little weird:
// sometimes they'll have the union's type name, but sometimes they'll have the inhabitant's type name instead;
// this depends on whether the error is an ErrWrongKind that was found while checking the method for appropriateness on the union's inhabitant
// versus if the error came from the union inhabitant itself after delegation occurred.
func NewUnionReprKindedGenerator(pkgName string, typ *schema.TypeUnion, adjCfg *AdjunctCfg) TypeGenerator {
return unionReprKindedGenerator{
type unionReprKindedGenerator struct {
func (g unionReprKindedGenerator) GetRepresentationNodeGen() NodeGenerator {
return unionReprKindedReprGenerator{
type unionReprKindedReprGenerator struct {
// Note that there's no MapTraits (or any other FooTraits) mixin in this one!
// This is no accident: *None* of them apply!
AdjCfg *AdjunctCfg
PkgName string
Type *schema.TypeUnion
// IsRepr always reports true for this generator.
func (unionReprKindedReprGenerator) IsRepr() bool { return true } // hint used in some generalized templates.
func (g unionReprKindedReprGenerator) EmitNodeType(w io.Writer) {
// The type is structurally the same, but will have a different set of methods.
type _{{ .Type | TypeSymbol }}__Repr _{{ .Type | TypeSymbol }}
`, w, g.AdjCfg, g)
func (g unionReprKindedReprGenerator) EmitNodeTypeAssertions(w io.Writer) {
var _ ipld.Node = &_{{ .Type | TypeSymbol }}__Repr{}
`, w, g.AdjCfg, g)
func (g unionReprKindedReprGenerator) EmitNodeMethodReprKind(w io.Writer) {
// FIXME wow
// A bunch of these methods could be improved by doing a gen-time switch for whether any of the possible members are the relevant kind at all;
// currently in the cases where there's no relevant members, we generate switch blocks that are empty except for their default...
// which works, but is arguably a little strange.
// I haven't checked if this dummy switch has any actual performance implications:
// I haven't tested if this produces unconditional assembly,
// nor if it successfully removes the access of the tag,
// though one might imagine a sufficiently clever compiler ought to do both of those things.
// Regardless, the gsloc is reducible. (Slightly. There are also bigger gains to be made elsewhere, I'm sure.)
func kindedUnionNodeMethodTemplateMunge(
methodSig string, condClause string, retClause string,
) string {
// We really could just... call the methods directly (and elide the switch entirely all the time), in the case of the "interface" implementation strategy.
// We don't, though, because that would deprive us of getting the union type's name in the wrong-kind errors...
// and in addition to that being sadface in general, it would be downright unacceptable if that behavior varied based on implementation strategy.
return `
func (n *_{{ .Type | TypeSymbol }}__Repr) ` + methodSig + ` {
{{- if (eq (.AdjCfg.UnionMemlayout .Type) "embedAll") }}
switch n.tag {
{{- range $i, $member := .Type.Members }}
` + condClause + `
case {{ add $i 1 }}:
return n.x{{ add $i 1 }}.Representation()` + retClause + `
{{- end}}
{{- end}}
{{- else if (eq (.AdjCfg.UnionMemlayout .Type) "interface") }}
switch n2 := n.x.(type) {
{{- range $i, $member := .Type.Members }}
` + condClause + `
case {{ $member | TypeSymbol }}:
return n2.Representation()` + retClause + `
{{- end}}
{{- end}}
{{- end}}
return nil, ipld.ErrWrongKind{doozy} // ... is this a good example of where ErrFoo.TypeName should indeed be freetext, so it can say "ThisUnion.Repr(inhabitant not FooMap)" ...?
// TODO damnit I need the method name again for error messages. ... maybe make the error be a clause, hm.
func (g unionReprKindedReprGenerator) EmitNodeMethodLookupByString(w io.Writer) {
`LookupByString(key string) (ipld.Node, error)`,
`{{- if eq $member.RepresentationBehavior.String "map" }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprGenerator) EmitNodeMethodLookupByIndex(w io.Writer) {
`LookupByIndex(idx int) (ipld.Node, error)`,
`{{- if eq $member.RepresentationBehavior.String "list" }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprGenerator) EmitNodeMethodLookupByNode(w io.Writer) {
`LookupByNode(key ipld.Node) (ipld.Node, error)`,
`{{- if or (eq $member.RepresentationBehavior.String "map") (eq $member.RepresentationBehavior.String "list") }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprGenerator) EmitNodeMethodLookupBySegment(w io.Writer) {
`LookupBySegment(seg ipld.PathSegment) (ipld.Node, error)`,
`{{- if or (eq $member.RepresentationBehavior.String "map") (eq $member.RepresentationBehavior.String "list") }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprGenerator) EmitNodeMethodMapIterator(w io.Writer) {
`MapIterator() ipld.MapIterator`,
`{{- if eq $member.RepresentationBehavior.String "map" }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprGenerator) EmitNodeMethodListIterator(w io.Writer) {
`ListIterator() ipld.ListIterator`,
`{{- if eq $member.RepresentationBehavior.String "list" }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprGenerator) EmitNodeMethodLength(w io.Writer) {
`Length() int`,
`{{- if or (eq $member.RepresentationBehavior.String "map") (eq $member.RepresentationBehavior.String "list") }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprGenerator) EmitNodeMethodIsAbsent(w io.Writer) {
func (n *_{{ .Type | TypeSymbol }}__Repr) IsAbsent() bool {
return false
`, w, g.AdjCfg, g)
func (g unionReprKindedReprGenerator) EmitNodeMethodIsNull(w io.Writer) {
func (n *_{{ .Type | TypeSymbol }}__Repr) IsNull() bool {
return false
`, w, g.AdjCfg, g)
func (g unionReprKindedReprGenerator) EmitNodeMethodAsBool(w io.Writer) {
`AsBool() (bool, error)`,
`{{- if eq $member.RepresentationBehavior.String "bool" }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprGenerator) EmitNodeMethodAsInt(w io.Writer) {
`AsInt() (int, error)`,
`{{- if eq $member.RepresentationBehavior.String "int" }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprGenerator) EmitNodeMethodAsFloat(w io.Writer) {
`AsFloat() (float64, error)`,
`{{- if eq $member.RepresentationBehavior.String "float" }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprGenerator) EmitNodeMethodAsString(w io.Writer) {
`AsString() (string, error)`,
`{{- if eq $member.RepresentationBehavior.String "string" }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprGenerator) EmitNodeMethodAsBytes(w io.Writer) {
`AsBytes() ([]byte, error)`,
`{{- if eq $member.RepresentationBehavior.String "bytes" }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprGenerator) EmitNodeMethodAsLink(w io.Writer) {
`AsLink() (ipld.Link, error)`,
`{{- if eq $member.RepresentationBehavior.String "link" }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprGenerator) EmitNodeMethodPrototype(w io.Writer) {
emitNodeMethodPrototype_typical(w, g.AdjCfg, g)
func (g unionReprKindedReprGenerator) EmitNodePrototypeType(w io.Writer) {
emitNodePrototypeType_typical(w, g.AdjCfg, g)
// --- NodeBuilder and NodeAssembler --->
func (g unionReprKindedReprGenerator) GetNodeBuilderGenerator() NodeBuilderGenerator {
return unionReprKindedReprBuilderGenerator{
type unionReprKindedReprBuilderGenerator struct {
AdjCfg *AdjunctCfg
PkgName string
Type *schema.TypeUnion
// IsRepr always reports true for this generator.
func (unionReprKindedReprBuilderGenerator) IsRepr() bool { return true } // hint used in some generalized templates.
func (g unionReprKindedReprBuilderGenerator) EmitNodeBuilderType(w io.Writer) {
emitEmitNodeBuilderType_typical(w, g.AdjCfg, g)
func (g unionReprKindedReprBuilderGenerator) EmitNodeBuilderMethods(w io.Writer) {
emitNodeBuilderMethods_typical(w, g.AdjCfg, g)
func (g unionReprKindedReprBuilderGenerator) EmitNodeAssemblerType(w io.Writer) {
// Much of this is familiar: the 'w', the 'm' are all as usual.
// Some things may look a little odd here compared to all other assemblers:
// we're kinda halfway between what's conventionally seen for a scalar and what's conventionally seen for a recursive.
// There's no 'maState' or 'laState'-typed fields (which feels like a scalar) because even if we end up acting like a map or list, that state is in the relevant child assembler.
// We don't even have a 'cm' field, because we can get away with something really funky: we can just copy our own 'm' _pointer_ into children; our doneness and their doneness are the same.
// We never have to worry about maybeism of our children; the nullable and optional modifiers aren't possible on union members.
// (We *do* still have to consider null values though, as null is still a kind, and thus can be routed to one of our members!)
// 'ca' is as it is in the type-level assembler: technically, not super necessary, except that it allows minimizing the amount of work that resetting needs to do.
type _{{ .Type | TypeSymbol }}__ReprAssembler struct {
w *_{{ .Type | TypeSymbol }}
m *schema.Maybe
{{- range $i, $member := .Type.Members }}
ca{{ add $i 1 }} {{ if (eq (dot.AdjCfg.UnionMemlayout dot.Type) "interface") }}*{{end}}_{{ $member | TypeSymbol }}__ReprAssembler
{{end -}}
ca uint
`, w, g.AdjCfg, g)
func (na *_{{ .Type | TypeSymbol }}__ReprAssembler) reset() {
na.state = maState_initial
switch {
case 0:
{{- range $i, $member := .Type.Members }}
case {{ add $i 1 }}:{{ add $i 1 }}.reset()
{{end -}}
`, w, g.AdjCfg, g)
func kindedUnionNodeAssemblerMethodTemplateMunge(
methodSig string, condClause string, retClause string,
) string {
// The value pointed to by `na.m` isn't modified here, because we're sharing it with the child, who should do so.
// This also means that value gets checked twice -- once by us, because we need to halt if we've already been used --
// and also a second time by the child when we delegate to it, which, unbeknownst to it, is irrelevant.
// I don't see a good way to remedy this short of making more granular (unexported!) methods. (Might be worth it.)
// This probably also isn't the same for all of the assembler methods: the methods we delegate to aren't doing as many check branches when they're for scalars,
// because they expected to be used in contexts where many values of the 'm' enum aren't reachable -- an expectation we've suddenly subverted with this path!
return `
func (na *_{{ .Type | TypeSymbol }}__ReprAssembler) ` + methodSig + ` {
switch *na.m {
case schema.Maybe_Value, schema.Maybe_Null:
panic("invalid state: cannot assign into assembler that's already finished")
case midvalue:
panic("invalid state: cannot assign into assembler that's already working on a larger structure!")
{{- range $i, $member := .Type.Members }}
` + condClause + `
{{- if dot.Type | MaybeUsesPtr }}
if na.w == nil {
na.w = &_{{ dot.Type | TypeSymbol }}{}
{{- end}} = {{ add $i 1 }}
{{- if (eq (dot.AdjCfg.UnionMemlayout dot.Type) "embedAll") }}
na.w.tag = {{ add $i 1 }}{{ add $i 1 }}.w = &na.w.x{{ add $i 1 }}{{ add $i 1 }}.m = na.m
return{{ add $i 1 }}.BeginMap(sizeHint)
{{- else if (eq (dot.AdjCfg.UnionMemlayout dot.Type) "interface") }}
x := &_{{ $member | TypeSymbol }}{}
na.w.x = x
if{{ add $i 1 }} == nil {{{ add $i 1 }} = &_{{ $member | TypeSymbol }}__ReprAssembler{}
}{{ add $i 1 }}.w = x{{ add $i 1 }}.m = na.m
return{{ add $i 1 }}` + retClause + `
{{- end}}
{{- end}}
{{- end}}
// TODO i think you finally Need a method for if-no-members-match-this-kind for the default rejection to compile this time.
return nil, ipld.ErrWrongKind{doozy}
func (g unionReprKindedReprBuilderGenerator) EmitNodeAssemblerMethodBeginMap(w io.Writer) {
`BeginMap(sizeHint int) (ipld.MapAssembler, error)`,
`{{- if eq $member.RepresentationBehavior.String "map" }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprBuilderGenerator) EmitNodeAssemblerMethodBeginList(w io.Writer) {
`BeginList(sizeHint int) (ipld.ListAssembler, error)`,
`{{- if eq $member.RepresentationBehavior.String "list" }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprBuilderGenerator) EmitNodeAssemblerMethodAssignNull(w io.Writer) {
// TODO: I think this may need some special handling to account for if our union is itself used in a nullable circumstance; that should overrule this behavior.
`AssignNull() error `,
`{{- if eq $member.RepresentationBehavior.String "null" }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprBuilderGenerator) EmitNodeAssemblerMethodAssignBool(w io.Writer) {
`AssignBool(v bool) error `,
`{{- if eq $member.RepresentationBehavior.String "bool" }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprBuilderGenerator) EmitNodeAssemblerMethodAssignInt(w io.Writer) {
`AssignInt(v int) error `,
`{{- if eq $member.RepresentationBehavior.String "int" }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprBuilderGenerator) EmitNodeAssemblerMethodAssignFloat(w io.Writer) {
`AssignFloat(v float64) error `,
`{{- if eq $member.RepresentationBehavior.String "float" }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprBuilderGenerator) EmitNodeAssemblerMethodAssignString(w io.Writer) {
`AssignString(v string) error `,
`{{- if eq $member.RepresentationBehavior.String "string" }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprBuilderGenerator) EmitNodeAssemblerMethodAssignBytes(w io.Writer) {
`AssignBytes(v []byte) error `,
`{{- if eq $member.RepresentationBehavior.String "bytes" }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprBuilderGenerator) EmitNodeAssemblerMethodAssignLink(w io.Writer) {
`AssignLink(v ipld.Link) error `,
`{{- if eq $member.RepresentationBehavior.String "link" }}`,
), w, g.AdjCfg, g)
func (g unionReprKindedReprBuilderGenerator) EmitNodeAssemblerMethodAssignNode(w io.Writer) {
// TODO this is too wild for me at the moment, come back to it shortly
// it's basically got some of the body of kindedUnionNodeAssemblerMethodTemplateMunge, but repeated many more times.
// it also needs to handle nulls gingerly.
// and also handle pumping the full copy in the case of lists or maps.
// this is gonna have a fun ErrWrongKind value too -- we might actually have to make a non-static set of acceptable kinds :D that's a first.
func (g unionReprKindedReprBuilderGenerator) EmitNodeAssemblerMethodPrototype(w io.Writer) {
func (na *_{{ .Type | TypeSymbol }}__ReprAssembler) Prototype() ipld.NodePrototype {
return _{{ .Type | TypeSymbol }}__ReprPrototype{}
`, w, g.AdjCfg, g)
func (g unionReprKindedReprBuilderGenerator) EmitNodeAssemblerOtherBits(w io.Writer) {
// somewhat shockingly: nothing.
......@@ -50,6 +50,8 @@ func Generate(pth string, pkgName string, ts schema.TypeSystem, adjCfg *AdjunctC
switch t2.RepresentationStrategy().(type) {
case schema.UnionRepresentation_Keyed:
EmitEntireType(NewUnionReprKeyedGenerator(pkgName, t2, adjCfg), f)
case schema.UnionRepresentation_Kinded:
EmitEntireType(NewUnionReprKindedGenerator(pkgName, t2, adjCfg), f)
panic("unrecognized union representation strategy")
......@@ -2,6 +2,8 @@ package schema
import (
// Everything in this file is __a temporary hack__ and will be __removed__.
......@@ -102,6 +104,9 @@ func SpawnUnion(name TypeName, members []TypeName, repr UnionRepresentation) *Ty
func SpawnUnionRepresentationKeyed(table map[string]TypeName) UnionRepresentation_Keyed {
return UnionRepresentation_Keyed{table}
func SpawnUnionRepresentationKinded(table map[ipld.ReprKind]TypeName) UnionRepresentation_Kinded {
return UnionRepresentation_Kinded{table}
// The methods relating to TypeSystem are also mutation-heavy and placeholdery.
......@@ -73,6 +73,22 @@ type Type interface {
// can vary in representation kind based on their value (specifically,
// kinded-representation unions have this property).
Kind() Kind
// RepresentationBehavior returns a description of how the representation
// of this type will behave in terms of the IPLD Data Model.
// This property varies based on the representation strategy of a type.
// In one case, the representation behavior cannot be known statically,
// and varies based on the data: kinded unions have this trait.
// This property is used by kinded unions, which require that their members
// all have distinct representation behavior.
// (It follows that a kinded union cannot have another kinded union as a member.)
// You may also be interested in a related property that might have been called "TypeBehavior".
// However, this method doesn't exist, because it's a deterministic property of `Kind()`!
// You can use `Kind.ActsLike()` to get type-level behavioral information.
RepresentationBehavior() ipld.ReprKind
var (
package schema
import (
ipld ""
/* cookie-cutter standard interface stuff */
func (t *typeBase) _Type(ts *TypeSystem) {
......@@ -20,6 +24,47 @@ func (TypeUnion) Kind() Kind { return Kind_Union }
// Kind returns the constant Kind_Struct for TypeStruct.
func (TypeStruct) Kind() Kind { return Kind_Struct }

// Kind returns the constant Kind_Enum for TypeEnum.
func (TypeEnum) Kind() Kind { return Kind_Enum }
// RepresentationBehavior for each of the types below is unconditional:
// every method returns one fixed ipld.ReprKind constant, regardless of the value.
func (TypeBool) RepresentationBehavior() ipld.ReprKind { return ipld.ReprKind_Bool }
func (TypeString) RepresentationBehavior() ipld.ReprKind { return ipld.ReprKind_String }
func (TypeBytes) RepresentationBehavior() ipld.ReprKind { return ipld.ReprKind_Bytes }
func (TypeInt) RepresentationBehavior() ipld.ReprKind { return ipld.ReprKind_Int }
func (TypeFloat) RepresentationBehavior() ipld.ReprKind { return ipld.ReprKind_Float }
func (TypeMap) RepresentationBehavior() ipld.ReprKind { return ipld.ReprKind_Map }
func (TypeList) RepresentationBehavior() ipld.ReprKind { return ipld.ReprKind_List }
func (TypeLink) RepresentationBehavior() ipld.ReprKind { return ipld.ReprKind_Link }
func (t TypeUnion) RepresentationBehavior() ipld.ReprKind {
switch t.representation.(type) {
case UnionRepresentation_Keyed:
return ipld.ReprKind_Map
case UnionRepresentation_Kinded:
return ipld.ReprKind_Invalid // you can't know with this one, until you see the value (and thus can see its inhabitant's behavior)!
case UnionRepresentation_Envelope:
return ipld.ReprKind_Map
case UnionRepresentation_Inline:
return ipld.ReprKind_Map
func (t TypeStruct) RepresentationBehavior() ipld.ReprKind {
switch t.representation.(type) {
case StructRepresentation_Map:
return ipld.ReprKind_Map
case StructRepresentation_Tuple:
return ipld.ReprKind_List
case StructRepresentation_StringPairs:
return ipld.ReprKind_String
case StructRepresentation_Stringjoin:
return ipld.ReprKind_String
func (t TypeEnum) RepresentationBehavior() ipld.ReprKind {
// TODO: this should have a representation strategy switch too; sometimes that will indicate int representation behavior.
return ipld.ReprKind_String
/* interesting methods per Type type */
// beware: many of these methods will change when we successfully bootstrap self-hosting.
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment