rewrite, simplify and "power-up" unification
This commit is contained in:
parent
d3515d39a5
commit
dfe03eab6e
4 changed files with 211 additions and 175 deletions
|
|
@ -1,10 +1,10 @@
|
|||
import { inspect } from "node:util";
|
||||
import { eqType, getSymbol } from "../primitives/type.js";
|
||||
import { zip } from "../util/util.js";
|
||||
import { pretty, prettyT } from '../util/pretty.js';
|
||||
import { isTypeVar, TYPE_VARS } from "../primitives/typevars.js";
|
||||
import { inspectType } from "../meta/type_constructor.js";
|
||||
import { inspectType, makeTypeConstructor } from "../meta/type_constructor.js";
|
||||
import { getSymbol } from "../primitives/type.js";
|
||||
import { isTypeVar, TYPE_VARS, UNBOUND_SYMBOLS } from "../primitives/typevars.js";
|
||||
import { symbolFunction } from "../structures/type_constructors.js";
|
||||
import { prettyT } from '../util/pretty.js';
|
||||
import { reduceUnif, unifyLL } from "./low_level.js";
|
||||
|
||||
// helper for creating generic types
|
||||
// for instance, the type:
|
||||
|
|
@ -35,137 +35,16 @@ const _occurring = stack => type => {
|
|||
// Get the set of type variables occurring in a type.
// `_occurring` is curried as `stack => type => ...`; it is applied to an empty
// stack here, so `occurring` only takes the type.
|
||||
export const occurring = _occurring([]);
|
||||
|
||||
// Merge 2 substitution-mappings, uni-directional.
//
// Performs AT MOST ONE fold per call: the first entry of m1 whose substituted
// type is itself a key of m2 gets rewritten to m2's substitution for it, and
// that key is dropped from the copy of m2.
//
// Neither input is mutated; both are copied up front.
//
// Returns [stable, m1copy, m2copy]; `stable` is true when nothing was folded.
const mergeOneWay = (m1, m2) => {
  const folded = new Map(m1);
  const leftover = new Map(m2);
  for (const [key, replacement] of folded) {
    const replacementSymbol = getSymbol(replacement);
    if (!leftover.has(replacementSymbol)) {
      continue;
    }
    // `replacement` is a typeVar for which we also have a substitution
    // -> fold substitutions, and report that another pass is needed
    folded.set(key, m2.get(replacementSymbol));
    leftover.delete(replacementSymbol);
    return [false, folded, leftover];
  }
  return [true, folded, leftover]; // stable
};
|
||||
|
||||
// Verifies that two substitution-mappings agree on every key they share.
//
// For each key of m1 that is also a key of m2, the two substituted types must
// be equal according to eqType.
//
// Throws Error("conflicting substitution: ...") on the first disagreement.
// Returns nothing.
const checkConflict = (m1, m2) => {
  for (const [symbol, typ1] of m1) {
    if (!m2.has(symbol)) {
      continue; // key only occurs in m1: nothing to compare
    }
    const other = m2.get(symbol);
    if (!eqType(typ1, other)) {
      throw new Error(`conflicting substitution: ${pretty(typ1)} vs. ${pretty(other)}`);
    }
  }
};
|
||||
|
||||
// Merge 2 substitution-mappings, bi-directional.
//
// First checks that m1 and m2 do not disagree on a shared key (checkConflict
// throws if they do), then repeatedly folds substitutions, alternating the
// direction on every pass, until BOTH directions are stable.
//
// Returns a new Map; the inputs are not mutated (mergeOneWay works on copies).
export const mergeTwoWay = (m1, m2) => {
  checkConflict(m1, m2);
  // checkConflict(m2, m1); // <- don't think this is necessary...

  let left = m1;
  let right = m2;
  // Number of stable passes IN A ROW. Two consecutive stable passes means one
  // per direction, i.e. a real fixpoint. Counting stable passes in total (as
  // the previous version did) could stop while one direction still had
  // substitutions left to fold.
  let stableStreak = 0;
  while (stableStreak < 2) {
    // notice we swap left and right, so the rewriting can happen both ways:
    const [stable, nextRight, nextLeft] = mergeOneWay(left, right);
    left = nextLeft;
    right = nextRight;
    // Every unstable pass removes one entry from one of the maps, so this terminates.
    stableStreak = stable ? stableStreak + 1 : 0;
  }
  return new Map([...left, ...right]);
};
|
||||
|
||||
// Thrown when two types cannot be unified.
export class UnifyError extends Error {}
// Give instances a proper `name`, so messages and stack traces read
// "UnifyError: ..." instead of a generic "Error: ...". It is defined on the
// prototype with the same attributes as Error.prototype.name, so it does not
// show up as an own/enumerable property of instances.
Object.defineProperty(UnifyError.prototype, "name", {
  value: "UnifyError",
  writable: true,
  configurable: true,
  enumerable: false,
});
|
||||
// Thrown when a function type was expected but something else was given.
export class NotAFunctionError extends Error {}
// Give instances a proper `name`, so messages and stack traces read
// "NotAFunctionError: ..." instead of a generic "Error: ...". It is defined on
// the prototype with the same attributes as Error.prototype.name, so it does
// not show up as an own/enumerable property of instances.
Object.defineProperty(NotAFunctionError.prototype, "name", {
  value: "NotAFunctionError",
  writable: true,
  configurable: true,
  enumerable: false,
});
|
||||
|
||||
// Unifies a "formal" type with an "actual" type.
//
// Thanks to Hans for pointing out that this algorithm is exactly like "Unification" in Prolog (hence the function name):
//   https://www.dai.ed.ac.uk/groups/ssp/bookpages/quickprolog/node12.html
//
// Parameters:
//   fType, aType: generic types to unify
//   fStack, aStack: internal use (grown by one entry per level of recursion).
//
// Returns { substitutions, type }:
//   substitutions: Map from type-variable symbol to the type it was bound to
//   type: the unified type
//
// Throws UnifyError when the type constructors differ, or when the two types
// differ in the way they refer back to an enclosing type.
export const __unify = (fType, aType, fStack=[], aStack=[]) => {
  // Simplest case: one side is a type parameter => substitute it with the
  // other side. The formal side is tried first.
  const bindVar = (typeVar, boundType) => ({
    substitutions: new Map([[getSymbol(typeVar), boundType]]),
    type: boundType,
  });
  if (isTypeVar(fType)) {
    return bindVar(fType, aType);
  }
  if (isTypeVar(aType)) {
    return bindVar(aType, fType);
  }

  // Neither side is a type variable: the type constructors must match before
  // the parameters are unified recursively.
  if (fType.symbol !== aType.symbol) {
    throw new UnifyError(`cannot unify ${prettyT(fType)} and ${prettyT(aType)}`);
  }

  const fDepth = fStack.length;
  const aDepth = aStack.length;

  // One deferred unification per pair of parameters. Each takes the parent
  // type, because parameters are themselves functions of their parent.
  const paramUnifiers = zip(fType.params, aType.params)
    .map(([getFParam, getAParam]) => {
      const fParam = getFParam(fDepth);
      const aParam = getAParam(aDepth);
      // A parameter may recursively point to an enclosing type that we've
      // already seen. Both sides must then point to the same one
      // (both being unmapped, i.e. undefined, is fine as well).
      const enclosing = fStack[fParam];
      if (enclosing !== aStack[aParam]) {
        throw new UnifyError("cannot unify: types differ in their recursion");
      }
      if (enclosing === undefined) {
        // Ordinary parameter: recurse, with the parent pushed onto both stacks.
        return parent => __unify(fParam, aParam,
          [...fStack, parent],
          [...aStack, parent]);
      }
      // Back-reference: nothing new to learn, just hand back the enclosing type.
      return () => ({
        substitutions: new Map(),
        type: enclosing,
      });
    });

  const params = paramUnifiers.map(unifier => parent => unifier(parent).type);

  // Collect the substitutions of all parameters into a single mapping.
  let substitutions = new Map();
  for (const unifier of paramUnifiers) {
    const placeholder = Symbol(); // dirty, just need something unique
    substitutions = mergeTwoWay(substitutions, unifier(placeholder).substitutions);
  }

  return {
    substitutions,
    type: {
      symbol: fType.symbol,
      params,
      [inspect.custom]: inspectType,
    },
  };
};
|
||||
|
||||
// Unifies two types and returns the resulting type, with its type variables
// renumbered.
//
// Throws whatever unifyLL / reduceUnif throw when the types do not unify.
export const unify = (fType, aType) => {
  // The two types may have overlapping type variables, so recompute them to
  // make them non-overlapping before unifying.
  const [fType1, aType1] = recomputeTypeVars([fType, aType]);
  const unification = unifyLL(fType1, aType1);
  const substitutions = reduceUnif(unification);
  const uType = substitute(fType1, // or aType1, doesn't matter here
                           substitutions);
  // 'Normalize' the type variables of the result.
  return recomputeTypeVars([uType])[0];
};
|
||||
|
||||
export const substitute = (type, substitutions, stack=[]) => {
|
||||
|
|
@ -188,41 +67,42 @@ export const substitute = (type, substitutions, stack=[]) => {
|
|||
};
|
||||
};
|
||||
|
||||
// Computes the output type of a function of type `funType` when it is given a
// parameter of type `paramType`.
//
// Parameters:
//   funType: must be a function type (its symbol must be symbolFunction)
//   paramType: type of the parameter being passed
//   skip: forwarded to the final recomputeTypeVars call (index of the first
//         type variable to use for the result)
//
// Throws NotAFunctionError if funType is not a function type.
export const assignFn = (funType, paramType, skip=0) => {
  // Precondition
  if (getSymbol(funType) !== symbolFunction) {
    throw new NotAFunctionError(`${prettyT(funType)} is not a function type!`);
  }

  // Step 1: Very important: Function and parameter type may have overlapping type variables, so we recompute them to make them non-overlapping:
  const [funType1, paramType1] = recomputeTypeVars([funType, paramType]);

  // Step 2: Get input and output type of function
  const [inType1, outType1] = funType1.params.map(p => p(funType1));

  // Step 3: Unify parameter type with input type
  const unifInType1 = unifyLL(inType1, paramType1);

  // Step 4: Substitute typevars in output type
  const substInType1 = reduceUnif(unifInType1);
  const reducedOutType1 = substitute(outType1, substInType1);

  // Step 5: 'Normalize' output type
  const [outType] = recomputeTypeVars([reducedOutType1], skip);
  return outType;
};

// Variant built on __unify / mergeTwoWay that also returns the substitutions
// that took place.
//
// Returns [newInType, totalParamSubstitutions, finalOutType, totalOutSubstitutions].
// Throws NotAFunctionError if funType is not a function type.
export const assignFnSubstitutions = (funType, paramType, skip=0) => {
  // Precondition
  if (getSymbol(funType) !== symbolFunction) {
    throw new NotAFunctionError(`${prettyT(funType)} is not a function type!`);
  }
  const [[refunType, funS], [reparamType, paramS]] = recomputeTypeVarsSubstitutions([funType, paramType], skip);
  const [inType, outType] = refunType.params.map(p => p(refunType));
  const {type: newInType, substitutions} = __unify(inType, reparamType);
  const totalParamSubstitutions = mergeTwoWay(substitutions, paramS);
  const newOutType = substitute(outType, substitutions);
  const [[finalOutType, outsubst]] = recomputeTypeVarsSubstitutions([newOutType], skip);
  const totalOutSubstitutions = mergeTwoWay(funS, outsubst);
  return [newInType, totalParamSubstitutions, finalOutType, totalOutSubstitutions];
};
|
||||
|
||||
// Ensures that no type variables overlap.
//
// Walks over `types` in order and hands every type variable occurring in them
// the next entry of TYPE_VARS, starting at index `skip`. The counter is shared
// across all given types.
//
// Returns the rewritten types, in the same order.
export const recomputeTypeVars = (types, skip=0) => {
  let nextIdx = skip;
  return types.map(type => {
    const substitutions = new Map();
    const typeVars = occurring(type);
    for (const typeVar of typeVars) {
      const idx = nextIdx++;
      // Only substitute when the variable is not already the one for this index.
      if (typeVar !== UNBOUND_SYMBOLS[idx]) {
        substitutions.set(typeVar, TYPE_VARS[idx]);
      }
    }
    return substitute(type, substitutions);
  });
};

// Like recomputeTypeVars, but substitutes every type variable unconditionally
// and also returns the substitutions that were applied.
//
// Returns one [newType, substitutions] pair per given type.
export const recomputeTypeVarsSubstitutions = (types, skip=0) => {
  let nextIdx = skip;
  return types.map(type => {
    const substitutions = new Map();
    const typeVars = occurring(type);
    for (const typeVar of typeVars) {
      substitutions.set(typeVar, TYPE_VARS[nextIdx++]);
    }
    return [substitute(type, substitutions), substitutions];
  });
};
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue