Source code

Revision control

Copy as Markdown

Other Tools

import { RecipeExecutor } from "lib/PersonalityProvider/RecipeExecutor.mjs";
import { tokenize } from "lib/PersonalityProvider/Tokenize.mjs";
class MockTagger {
constructor(mode, tagScoreMap) {
this.mode = mode;
this.tagScoreMap = tagScoreMap;
}
tagTokens() {
if (this.mode === "nb") {
// eslint-disable-next-line prefer-destructuring
let tag = Object.keys(this.tagScoreMap)[0];
// eslint-disable-next-line prefer-destructuring
let prob = this.tagScoreMap[tag];
let conf = prob >= 0.85;
return {
label: tag,
logProb: Math.log(prob),
confident: conf,
};
}
return this.tagScoreMap;
}
tag(text) {
return this.tagTokens([text]);
}
}
describe("RecipeExecutor", () => {
let makeItem = () => {
let x = {
lhs: 2,
one: 1,
two: 2,
three: 3,
foo: "FOO",
bar: "BAR",
baz: ["one", "two", "three"],
qux: 42,
text: "This Is A_sentence.",
map: {
c: 3,
a: 1,
b: 2,
},
map2: {
b: 2,
c: 3,
d: 4,
},
arr1: [2, 3, 4],
arr2: [3, 4, 5],
long: [3, 4, 5, 6, 7],
tags: {
a: {
aa: 0.1,
ab: 0.2,
ac: 0.3,
},
b: {
ba: 4,
bb: 5,
bc: 6,
},
},
bogus: {
a: {
aa: "0.1",
ab: "0.2",
ac: "0.3",
},
b: {
ba: "4",
bb: "5",
bc: "6",
},
},
zero: {
a: 0,
b: 0,
},
zaro: [0, 0],
};
return x;
};
let EPSILON = 0.00001;
let instance = new RecipeExecutor(
[
new MockTagger("nb", { tag1: 0.7 }),
new MockTagger("nb", { tag2: 0.86 }),
new MockTagger("nb", { tag3: 0.9 }),
new MockTagger("nb", { tag5: 0.9 }),
],
{
tag1: new MockTagger("nmf", {
tag11: 0.9,
tag12: 0.8,
tag13: 0.7,
}),
tag2: new MockTagger("nmf", {
tag21: 0.8,
tag22: 0.7,
tag23: 0.6,
}),
tag3: new MockTagger("nmf", {
tag31: 0.7,
tag32: 0.6,
tag33: 0.5,
}),
tag4: new MockTagger("nmf", { tag41: 0.99 }),
},
tokenize
);
let item = null;
beforeEach(() => {
item = makeItem();
});
describe("#_assembleText", () => {
it("should simply copy a single string", () => {
assert.equal(instance._assembleText(item, ["foo"]), "FOO");
});
it("should append some strings with a space", () => {
assert.equal(instance._assembleText(item, ["foo", "bar"]), "FOO BAR");
});
it("should give an empty string for a missing field", () => {
assert.equal(instance._assembleText(item, ["missing"]), "");
});
it("should not double space an interior missing field", () => {
assert.equal(
instance._assembleText(item, ["foo", "missing", "bar"]),
"FOO BAR"
);
});
it("should splice in an array of strings", () => {
assert.equal(
instance._assembleText(item, ["foo", "baz", "bar"]),
"FOO one two three BAR"
);
});
it("should handle numbers", () => {
assert.equal(
instance._assembleText(item, ["foo", "qux", "bar"]),
"FOO 42 BAR"
);
});
});
describe("#naiveBayesTag", () => {
it("should understand NaiveBayesTextTagger", () => {
item = instance.naiveBayesTag(item, { fields: ["text"] });
assert.isTrue("nb_tags" in item);
assert.isTrue(!("tag1" in item.nb_tags));
assert.equal(item.nb_tags.tag2, 0.86);
assert.equal(item.nb_tags.tag3, 0.9);
assert.equal(item.nb_tags.tag5, 0.9);
assert.isTrue("nb_tokens" in item);
assert.deepEqual(item.nb_tokens, ["this", "is", "a", "sentence"]);
assert.isTrue("nb_tags_extended" in item);
assert.isTrue(!("tag1" in item.nb_tags_extended));
assert.deepEqual(item.nb_tags_extended.tag2, {
label: "tag2",
logProb: Math.log(0.86),
confident: true,
});
assert.deepEqual(item.nb_tags_extended.tag3, {
label: "tag3",
logProb: Math.log(0.9),
confident: true,
});
assert.deepEqual(item.nb_tags_extended.tag5, {
label: "tag5",
logProb: Math.log(0.9),
confident: true,
});
assert.isTrue("nb_tokens" in item);
assert.deepEqual(item.nb_tokens, ["this", "is", "a", "sentence"]);
});
});
describe("#conditionallyNmfTag", () => {
it("should do nothing if it's not nb tagged", () => {
item = instance.conditionallyNmfTag(item, {});
assert.equal(item, null);
});
it("should populate nmf tags for the nb tags", () => {
item = instance.naiveBayesTag(item, { fields: ["text"] });
item = instance.conditionallyNmfTag(item, {});
assert.isTrue("nb_tags" in item);
assert.deepEqual(item.nmf_tags, {
tag2: {
tag21: 0.8,
tag22: 0.7,
tag23: 0.6,
},
tag3: {
tag31: 0.7,
tag32: 0.6,
tag33: 0.5,
},
});
assert.deepEqual(item.nmf_tags_parent, {
tag21: "tag2",
tag22: "tag2",
tag23: "tag2",
tag31: "tag3",
tag32: "tag3",
tag33: "tag3",
});
});
it("should not populate nmf tags for things that were not nb tagged", () => {
item = instance.naiveBayesTag(item, { fields: ["text"] });
item = instance.conditionallyNmfTag(item, {});
assert.isTrue("nmf_tags" in item);
assert.isTrue(!("tag4" in item.nmf_tags));
assert.isTrue("nmf_tags_parent" in item);
assert.isTrue(!("tag4" in item.nmf_tags_parent));
});
});
describe("#acceptItemByFieldValue", () => {
it("should implement ==", () => {
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: "==",
rhsValue: 2,
}) !== null
);
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: "==",
rhsValue: 3,
}) === null
);
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: "==",
rhsField: "two",
}) !== null
);
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: "==",
rhsField: "three",
}) === null
);
});
it("should implement !=", () => {
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: "!=",
rhsValue: 2,
}) === null
);
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: "!=",
rhsValue: 3,
}) !== null
);
});
it("should implement < ", () => {
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: "<",
rhsValue: 1,
}) === null
);
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: "<",
rhsValue: 2,
}) === null
);
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: "<",
rhsValue: 3,
}) !== null
);
});
it("should implement <= ", () => {
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: "<=",
rhsValue: 1,
}) === null
);
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: "<=",
rhsValue: 2,
}) !== null
);
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: "<=",
rhsValue: 3,
}) !== null
);
});
it("should implement > ", () => {
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: ">",
rhsValue: 1,
}) !== null
);
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: ">",
rhsValue: 2,
}) === null
);
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: ">",
rhsValue: 3,
}) === null
);
});
it("should implement >= ", () => {
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: ">=",
rhsValue: 1,
}) !== null
);
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: ">=",
rhsValue: 2,
}) !== null
);
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: ">=",
rhsValue: 3,
}) === null
);
});
it("should skip items with missing fields", () => {
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "no-left",
op: "==",
rhsValue: 1,
}) === null
);
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: "==",
rhsField: "no-right",
}) === null
);
assert.isTrue(
instance.acceptItemByFieldValue(item, { field: "lhs", op: "==" }) ===
null
);
});
it("should skip items with bogus operators", () => {
assert.isTrue(
instance.acceptItemByFieldValue(item, {
field: "lhs",
op: "bogus",
rhsField: "two",
}) === null
);
});
});
describe("#tokenizeUrl", () => {
it("should strip the leading www from a url", () => {
item = instance.tokenizeUrl(item, { field: "url", dest: "url_toks" });
assert.deepEqual(
[
"wonder",
"example",
"com",
"dir1",
"dir2a",
"dir2b",
"dir3",
"4",
"key1",
"key2",
"val2",
"key3",
"amp",
"3",
"4",
],
item.url_toks
);
});
it("should tokenize the not strip the leading non-wwww token from a url", () => {
item = instance.tokenizeUrl(item, { field: "url2", dest: "url_toks" });
assert.deepEqual(
[
"wonder",
"example",
"com",
"dir1",
"dir2a",
"dir2b",
"dir3",
"4",
"key1",
"key2",
"val2",
"key3",
"amp",
"3",
"4",
],
item.url_toks
);
});
it("should error for a missing url", () => {
item = instance.tokenizeUrl(item, { field: "missing", dest: "url_toks" });
assert.equal(item, null);
});
});
describe("#getUrlDomain", () => {
it("should get only the hostname skipping the www", () => {
item = instance.getUrlDomain(item, { field: "url", dest: "url_domain" });
assert.isTrue("url_domain" in item);
assert.deepEqual("wonder.example.com", item.url_domain);
});
it("should get only the hostname", () => {
item = instance.getUrlDomain(item, { field: "url2", dest: "url_domain" });
assert.isTrue("url_domain" in item);
assert.deepEqual("wonder.example.com", item.url_domain);
});
it("should get the hostname and 2 levels of directories", () => {
item = instance.getUrlDomain(item, {
field: "url",
path_length: 2,
dest: "url_plus_2",
});
assert.isTrue("url_plus_2" in item);
assert.deepEqual("wonder.example.com/dir1/dir2a-dir2b", item.url_plus_2);
});
it("should error for a missing url", () => {
item = instance.getUrlDomain(item, {
field: "missing",
dest: "url_domain",
});
assert.equal(item, null);
});
});
describe("#tokenizeField", () => {
it("should tokenize the field", () => {
item = instance.tokenizeField(item, { field: "text", dest: "toks" });
assert.isTrue("toks" in item);
assert.deepEqual(["this", "is", "a", "sentence"], item.toks);
});
it("should error for a missing field", () => {
item = instance.tokenizeField(item, { field: "missing", dest: "toks" });
assert.equal(item, null);
});
it("should error for a broken config", () => {
item = instance.tokenizeField(item, {});
assert.equal(item, null);
});
});
describe("#_typeOf", () => {
it("should know this is a map", () => {
assert.equal(instance._typeOf({}), "map");
});
it("should know this is an array", () => {
assert.equal(instance._typeOf([]), "array");
});
it("should know this is a string", () => {
assert.equal(instance._typeOf("blah"), "string");
});
it("should know this is a boolean", () => {
assert.equal(instance._typeOf(true), "boolean");
});
it("should know this is a null", () => {
assert.equal(instance._typeOf(null), "null");
});
});
describe("#_lookupScalar", () => {
it("should return the constant", () => {
assert.equal(instance._lookupScalar({}, 1, 0), 1);
});
it("should return the default", () => {
assert.equal(instance._lookupScalar({}, "blah", 42), 42);
});
it("should return the field's value", () => {
assert.equal(instance._lookupScalar({ blah: 11 }, "blah", 42), 11);
});
});
describe("#copyValue", () => {
it("should copy values", () => {
item = instance.copyValue(item, { src: "one", dest: "again" });
assert.isTrue("again" in item);
assert.equal(item.again, 1);
item.one = 100;
assert.equal(item.one, 100);
assert.equal(item.again, 1);
});
it("should handle maps corrects", () => {
item = instance.copyValue(item, { src: "map", dest: "again" });
assert.deepEqual(item.again, { a: 1, b: 2, c: 3 });
item.map.c = 100;
assert.deepEqual(item.again, { a: 1, b: 2, c: 3 });
item.map = 342;
assert.deepEqual(item.again, { a: 1, b: 2, c: 3 });
});
it("should error for a missing field", () => {
item = instance.copyValue(item, { src: "missing", dest: "toks" });
assert.equal(item, null);
});
});
describe("#keepTopK", () => {
it("should keep the 2 smallest", () => {
item = instance.keepTopK(item, { field: "map", k: 2, descending: false });
assert.equal(Object.keys(item.map).length, 2);
assert.isTrue("a" in item.map);
assert.equal(item.map.a, 1);
assert.isTrue("b" in item.map);
assert.equal(item.map.b, 2);
assert.isTrue(!("c" in item.map));
});
it("should keep the 2 largest", () => {
item = instance.keepTopK(item, { field: "map", k: 2, descending: true });
assert.equal(Object.keys(item.map).length, 2);
assert.isTrue(!("a" in item.map));
assert.isTrue("b" in item.map);
assert.equal(item.map.b, 2);
assert.isTrue("c" in item.map);
assert.equal(item.map.c, 3);
});
it("should still keep the 2 largest", () => {
item = instance.keepTopK(item, { field: "map", k: 2 });
assert.equal(Object.keys(item.map).length, 2);
assert.isTrue(!("a" in item.map));
assert.isTrue("b" in item.map);
assert.equal(item.map.b, 2);
assert.isTrue("c" in item.map);
assert.equal(item.map.c, 3);
});
it("should promote up nested fields", () => {
item = instance.keepTopK(item, { field: "tags", k: 2 });
assert.equal(Object.keys(item.tags).length, 2);
assert.deepEqual(item.tags, { bb: 5, bc: 6 });
});
it("should error for a missing field", () => {
item = instance.keepTopK(item, { field: "missing", k: 3 });
assert.equal(item, null);
});
});
describe("#scalarMultiply", () => {
it("should use constants", () => {
item = instance.scalarMultiply(item, { field: "map", k: 2 });
assert.equal(item.map.a, 2);
assert.equal(item.map.b, 4);
assert.equal(item.map.c, 6);
});
it("should use fields", () => {
item = instance.scalarMultiply(item, { field: "map", k: "three" });
assert.equal(item.map.a, 3);
assert.equal(item.map.b, 6);
assert.equal(item.map.c, 9);
});
it("should use default", () => {
item = instance.scalarMultiply(item, {
field: "map",
k: "missing",
dfault: 4,
});
assert.equal(item.map.a, 4);
assert.equal(item.map.b, 8);
assert.equal(item.map.c, 12);
});
it("should error for a missing field", () => {
item = instance.scalarMultiply(item, { field: "missing", k: 3 });
assert.equal(item, null);
});
it("should multiply numbers", () => {
item = instance.scalarMultiply(item, { field: "lhs", k: 2 });
assert.equal(item.lhs, 4);
});
it("should multiply arrays", () => {
item = instance.scalarMultiply(item, { field: "arr1", k: 2 });
assert.deepEqual(item.arr1, [4, 6, 8]);
});
it("should should error on strings", () => {
item = instance.scalarMultiply(item, { field: "foo", k: 2 });
assert.equal(item, null);
});
});
describe("#elementwiseMultiply", () => {
it("should handle maps", () => {
item = instance.elementwiseMultiply(item, {
left: "tags",
right: "map2",
});
assert.deepEqual(item.tags, {
a: { aa: 0, ab: 0, ac: 0 },
b: { ba: 8, bb: 10, bc: 12 },
});
});
it("should handle arrays of same length", () => {
item = instance.elementwiseMultiply(item, {
left: "arr1",
right: "arr2",
});
assert.deepEqual(item.arr1, [6, 12, 20]);
});
it("should error for arrays of different lengths", () => {
item = instance.elementwiseMultiply(item, {
left: "arr1",
right: "long",
});
assert.equal(item, null);
});
it("should error for a missing left", () => {
item = instance.elementwiseMultiply(item, {
left: "missing",
right: "arr2",
});
assert.equal(item, null);
});
it("should error for a missing right", () => {
item = instance.elementwiseMultiply(item, {
left: "arr1",
right: "missing",
});
assert.equal(item, null);
});
it("should handle numbers", () => {
item = instance.elementwiseMultiply(item, {
left: "three",
right: "two",
});
assert.equal(item.three, 6);
});
it("should error for mismatched types", () => {
item = instance.elementwiseMultiply(item, { left: "arr1", right: "two" });
assert.equal(item, null);
});
it("should error for strings", () => {
item = instance.elementwiseMultiply(item, { left: "foo", right: "bar" });
assert.equal(item, null);
});
});
describe("#vectorMultiply", () => {
it("should calculate dot products from maps", () => {
item = instance.vectorMultiply(item, {
left: "map",
right: "map2",
dest: "dot",
});
assert.equal(item.dot, 13);
});
it("should calculate dot products from arrays", () => {
item = instance.vectorMultiply(item, {
left: "arr1",
right: "arr2",
dest: "dot",
});
assert.equal(item.dot, 38);
});
it("should error for arrays of different lengths", () => {
item = instance.vectorMultiply(item, { left: "arr1", right: "long" });
assert.equal(item, null);
});
it("should error for a missing left", () => {
item = instance.vectorMultiply(item, { left: "missing", right: "arr2" });
assert.equal(item, null);
});
it("should error for a missing right", () => {
item = instance.vectorMultiply(item, { left: "arr1", right: "missing" });
assert.equal(item, null);
});
it("should error for mismatched types", () => {
item = instance.vectorMultiply(item, { left: "arr1", right: "two" });
assert.equal(item, null);
});
it("should error for strings", () => {
item = instance.vectorMultiply(item, { left: "foo", right: "bar" });
assert.equal(item, null);
});
});
describe("#scalarAdd", () => {
it("should error for a missing field", () => {
item = instance.scalarAdd(item, { field: "missing", k: 10 });
assert.equal(item, null);
});
it("should error for strings", () => {
item = instance.scalarAdd(item, { field: "foo", k: 10 });
assert.equal(item, null);
});
it("should work for numbers", () => {
item = instance.scalarAdd(item, { field: "one", k: 10 });
assert.equal(item.one, 11);
});
it("should add a constant to every cell on a map", () => {
item = instance.scalarAdd(item, { field: "map", k: 10 });
assert.deepEqual(item.map, { a: 11, b: 12, c: 13 });
});
it("should add a value from a field to every cell on a map", () => {
item = instance.scalarAdd(item, { field: "map", k: "qux" });
assert.deepEqual(item.map, { a: 43, b: 44, c: 45 });
});
it("should add a constant to every cell on an array", () => {
item = instance.scalarAdd(item, { field: "arr1", k: 10 });
assert.deepEqual(item.arr1, [12, 13, 14]);
});
});
describe("#vectorAdd", () => {
it("should calculate add vectors from maps", () => {
item = instance.vectorAdd(item, { left: "map", right: "map2" });
assert.equal(Object.keys(item.map).length, 4);
assert.isTrue("a" in item.map);
assert.equal(item.map.a, 1);
assert.isTrue("b" in item.map);
assert.equal(item.map.b, 4);
assert.isTrue("c" in item.map);
assert.equal(item.map.c, 6);
assert.isTrue("d" in item.map);
assert.equal(item.map.d, 4);
});
it("should work for missing left", () => {
item = instance.vectorAdd(item, { left: "missing", right: "arr2" });
assert.deepEqual(item.missing, [3, 4, 5]);
});
it("should error for missing right", () => {
item = instance.vectorAdd(item, { left: "arr2", right: "missing" });
assert.equal(item, null);
});
it("should error error for strings", () => {
item = instance.vectorAdd(item, { left: "foo", right: "bar" });
assert.equal(item, null);
});
it("should error for different types", () => {
item = instance.vectorAdd(item, { left: "arr2", right: "map" });
assert.equal(item, null);
});
it("should calculate add vectors from arrays", () => {
item = instance.vectorAdd(item, { left: "arr1", right: "arr2" });
assert.deepEqual(item.arr1, [5, 7, 9]);
});
it("should abort on different sized arrays", () => {
item = instance.vectorAdd(item, { left: "arr1", right: "long" });
assert.equal(item, null);
});
it("should calculate add vectors from arrays", () => {
item = instance.vectorAdd(item, { left: "arr1", right: "arr2" });
assert.deepEqual(item.arr1, [5, 7, 9]);
});
});
describe("#makeBoolean", () => {
it("should error for missing field", () => {
item = instance.makeBoolean(item, { field: "missing", threshold: 2 });
assert.equal(item, null);
});
it("should 0/1 a map", () => {
item = instance.makeBoolean(item, { field: "map", threshold: 2 });
assert.deepEqual(item.map, { a: 0, b: 0, c: 1 });
});
it("should a map of all 1s", () => {
item = instance.makeBoolean(item, { field: "map" });
assert.deepEqual(item.map, { a: 1, b: 1, c: 1 });
});
it("should -1/1 a map", () => {
item = instance.makeBoolean(item, {
field: "map",
threshold: 2,
keep_negative: true,
});
assert.deepEqual(item.map, { a: -1, b: -1, c: 1 });
});
it("should work an array", () => {
item = instance.makeBoolean(item, { field: "arr1", threshold: 3 });
assert.deepEqual(item.arr1, [0, 0, 1]);
});
it("should -1/1 an array", () => {
item = instance.makeBoolean(item, {
field: "arr1",
threshold: 3,
keep_negative: true,
});
assert.deepEqual(item.arr1, [-1, -1, 1]);
});
it("should 1 a high number", () => {
item = instance.makeBoolean(item, { field: "qux", threshold: 3 });
assert.equal(item.qux, 1);
});
it("should 0 a low number", () => {
item = instance.makeBoolean(item, { field: "qux", threshold: 70 });
assert.equal(item.qux, 0);
});
it("should -1 a low number", () => {
item = instance.makeBoolean(item, {
field: "qux",
threshold: 83,
keep_negative: true,
});
assert.equal(item.qux, -1);
});
it("should fail a string", () => {
item = instance.makeBoolean(item, { field: "foo", threshold: 3 });
assert.equal(item, null);
});
});
describe("#allowFields", () => {
it("should filter the keys out of a map", () => {
item = instance.allowFields(item, {
fields: ["foo", "missing", "bar"],
});
assert.deepEqual(item, { foo: "FOO", bar: "BAR" });
});
});
describe("#filterByValue", () => {
it("should fail on missing field", () => {
item = instance.filterByValue(item, { field: "missing", threshold: 2 });
assert.equal(item, null);
});
it("should filter the keys out of a map", () => {
item = instance.filterByValue(item, { field: "map", threshold: 2 });
assert.deepEqual(item.map, { c: 3 });
});
});
describe("#l2Normalize", () => {
it("should fail on missing field", () => {
item = instance.l2Normalize(item, { field: "missing" });
assert.equal(item, null);
});
it("should L2 normalize an array", () => {
item = instance.l2Normalize(item, { field: "arr1" });
assert.deepEqual(
item.arr1,
[0.3713906763541037, 0.5570860145311556, 0.7427813527082074]
);
});
it("should L2 normalize a map", () => {
item = instance.l2Normalize(item, { field: "map" });
assert.deepEqual(item.map, {
a: 0.2672612419124244,
b: 0.5345224838248488,
c: 0.8017837257372732,
});
});
it("should fail a string", () => {
item = instance.l2Normalize(item, { field: "foo" });
assert.equal(item, null);
});
it("should not bomb on a zero vector", () => {
item = instance.l2Normalize(item, { field: "zero" });
assert.deepEqual(item.zero, { a: 0, b: 0 });
item = instance.l2Normalize(item, { field: "zaro" });
assert.deepEqual(item.zaro, [0, 0]);
});
});
describe("#probNormalize", () => {
it("should fail on missing field", () => {
item = instance.probNormalize(item, { field: "missing" });
assert.equal(item, null);
});
it("should normalize an array to sum to 1", () => {
item = instance.probNormalize(item, { field: "arr1" });
assert.deepEqual(
item.arr1,
[0.2222222222222222, 0.3333333333333333, 0.4444444444444444]
);
});
it("should normalize a map to sum to 1", () => {
item = instance.probNormalize(item, { field: "map" });
assert.equal(Object.keys(item.map).length, 3);
assert.isTrue("a" in item.map);
assert.isTrue(Math.abs(item.map.a - 0.16667) <= EPSILON);
assert.isTrue("b" in item.map);
assert.isTrue(Math.abs(item.map.b - 0.33333) <= EPSILON);
assert.isTrue("c" in item.map);
assert.isTrue(Math.abs(item.map.c - 0.5) <= EPSILON);
});
it("should fail a string", () => {
item = instance.probNormalize(item, { field: "foo" });
assert.equal(item, null);
});
it("should not bomb on a zero vector", () => {
item = instance.probNormalize(item, { field: "zero" });
assert.deepEqual(item.zero, { a: 0, b: 0 });
item = instance.probNormalize(item, { field: "zaro" });
assert.deepEqual(item.zaro, [0, 0]);
});
});
describe("#scalarMultiplyTag", () => {
it("should fail on missing field", () => {
item = instance.scalarMultiplyTag(item, { field: "missing", k: 3 });
assert.equal(item, null);
});
it("should scalar multiply a nested map", () => {
item = instance.scalarMultiplyTag(item, {
field: "tags",
k: 3,
log_scale: false,
});
assert.isTrue(Math.abs(item.tags.a.aa - 0.3) <= EPSILON);
assert.isTrue(Math.abs(item.tags.a.ab - 0.6) <= EPSILON);
assert.isTrue(Math.abs(item.tags.a.ac - 0.9) <= EPSILON);
assert.isTrue(Math.abs(item.tags.b.ba - 12) <= EPSILON);
assert.isTrue(Math.abs(item.tags.b.bb - 15) <= EPSILON);
assert.isTrue(Math.abs(item.tags.b.bc - 18) <= EPSILON);
});
it("should scalar multiply a nested map with logrithms", () => {
item = instance.scalarMultiplyTag(item, {
field: "tags",
k: 3,
log_scale: true,
});
assert.isTrue(
Math.abs(item.tags.a.aa - Math.log(0.1 + 0.000001) * 3) <= EPSILON
);
assert.isTrue(
Math.abs(item.tags.a.ab - Math.log(0.2 + 0.000001) * 3) <= EPSILON
);
assert.isTrue(
Math.abs(item.tags.a.ac - Math.log(0.3 + 0.000001) * 3) <= EPSILON
);
assert.isTrue(
Math.abs(item.tags.b.ba - Math.log(4.0 + 0.000001) * 3) <= EPSILON
);
assert.isTrue(
Math.abs(item.tags.b.bb - Math.log(5.0 + 0.000001) * 3) <= EPSILON
);
assert.isTrue(
Math.abs(item.tags.b.bc - Math.log(6.0 + 0.000001) * 3) <= EPSILON
);
});
it("should fail a string", () => {
item = instance.scalarMultiplyTag(item, { field: "foo", k: 3 });
assert.equal(item, null);
});
});
describe("#setDefault", () => {
it("should store a missing value", () => {
item = instance.setDefault(item, { field: "missing", value: 1111 });
assert.equal(item.missing, 1111);
});
it("should not overwrite an existing value", () => {
item = instance.setDefault(item, { field: "lhs", value: 1111 });
assert.equal(item.lhs, 2);
});
it("should store a complex value", () => {
item = instance.setDefault(item, { field: "missing", value: { a: 1 } });
assert.deepEqual(item.missing, { a: 1 });
});
});
describe("#lookupValue", () => {
it("should promote a value", () => {
item = instance.lookupValue(item, {
haystack: "map",
needle: "c",
dest: "ccc",
});
assert.equal(item.ccc, 3);
});
it("should handle a missing haystack", () => {
item = instance.lookupValue(item, {
haystack: "missing",
needle: "c",
dest: "ccc",
});
assert.isTrue(!("ccc" in item));
});
it("should handle a missing needle", () => {
item = instance.lookupValue(item, {
haystack: "map",
needle: "missing",
dest: "ccc",
});
assert.isTrue(!("ccc" in item));
});
});
describe("#copyToMap", () => {
it("should copy a value to a map", () => {
item = instance.copyToMap(item, {
src: "qux",
dest_map: "map",
dest_key: "zzz",
});
assert.isTrue("zzz" in item.map);
assert.equal(item.map.zzz, item.qux);
});
it("should create a new map to hold the key", () => {
item = instance.copyToMap(item, {
src: "qux",
dest_map: "missing",
dest_key: "zzz",
});
assert.equal(Object.keys(item.missing).length, 1);
assert.equal(item.missing.zzz, item.qux);
});
it("should not create an empty map if the src is missing", () => {
item = instance.copyToMap(item, {
src: "missing",
dest_map: "no_map",
dest_key: "zzz",
});
assert.isTrue(!("no_map" in item));
});
});
describe("#applySoftmaxTags", () => {
it("should error on missing field", () => {
item = instance.applySoftmaxTags(item, { field: "missing" });
assert.equal(item, null);
});
it("should error on nonmaps", () => {
item = instance.applySoftmaxTags(item, { field: "arr1" });
assert.equal(item, null);
});
it("should error on unnested maps", () => {
item = instance.applySoftmaxTags(item, { field: "map" });
assert.equal(item, null);
});
it("should error on wrong nested maps", () => {
item = instance.applySoftmaxTags(item, { field: "bogus" });
assert.equal(item, null);
});
it("should apply softmax across the subtags", () => {
item = instance.applySoftmaxTags(item, { field: "tags" });
assert.isTrue("a" in item.tags);
assert.isTrue("aa" in item.tags.a);
assert.isTrue("ab" in item.tags.a);
assert.isTrue("ac" in item.tags.a);
assert.isTrue(Math.abs(item.tags.a.aa - 0.30061) <= EPSILON);
assert.isTrue(Math.abs(item.tags.a.ab - 0.33222) <= EPSILON);
assert.isTrue(Math.abs(item.tags.a.ac - 0.36717) <= EPSILON);
assert.isTrue("b" in item.tags);
assert.isTrue("ba" in item.tags.b);
assert.isTrue("bb" in item.tags.b);
assert.isTrue("bc" in item.tags.b);
assert.isTrue(Math.abs(item.tags.b.ba - 0.09003) <= EPSILON);
assert.isTrue(Math.abs(item.tags.b.bb - 0.24473) <= EPSILON);
assert.isTrue(Math.abs(item.tags.b.bc - 0.66524) <= EPSILON);
});
});
describe("#combinerAdd", () => {
it("should do nothing when right field is missing", () => {
let right = makeItem();
let combined = instance.combinerAdd(item, right, { field: "missing" });
assert.deepEqual(combined, item);
});
it("should handle missing left maps", () => {
let right = makeItem();
right.missingmap = { a: 5, b: -1, c: 3 };
let combined = instance.combinerAdd(item, right, { field: "missingmap" });
assert.deepEqual(combined.missingmap, { a: 5, b: -1, c: 3 });
});
it("should add equal sized maps", () => {
let right = makeItem();
let combined = instance.combinerAdd(item, right, { field: "map" });
assert.deepEqual(combined.map, { a: 2, b: 4, c: 6 });
});
it("should add long map to short map", () => {
let right = makeItem();
right.map.d = 999;
let combined = instance.combinerAdd(item, right, { field: "map" });
assert.deepEqual(combined.map, { a: 2, b: 4, c: 6, d: 999 });
});
it("should add short map to long map", () => {
let right = makeItem();
item.map.d = 999;
let combined = instance.combinerAdd(item, right, { field: "map" });
assert.deepEqual(combined.map, { a: 2, b: 4, c: 6, d: 999 });
});
it("should add equal sized arrays", () => {
let right = makeItem();
let combined = instance.combinerAdd(item, right, { field: "arr1" });
assert.deepEqual(combined.arr1, [4, 6, 8]);
});
it("should handle missing left arrays", () => {
let right = makeItem();
right.missingarray = [5, 1, 4];
let combined = instance.combinerAdd(item, right, {
field: "missingarray",
});
assert.deepEqual(combined.missingarray, [5, 1, 4]);
});
it("should add long array to short array", () => {
let right = makeItem();
right.arr1 = [2, 3, 4, 12];
let combined = instance.combinerAdd(item, right, { field: "arr1" });
assert.deepEqual(combined.arr1, [4, 6, 8, 12]);
});
it("should add short array to long array", () => {
let right = makeItem();
item.arr1 = [2, 3, 4, 12];
let combined = instance.combinerAdd(item, right, { field: "arr1" });
assert.deepEqual(combined.arr1, [4, 6, 8, 12]);
});
it("should handle missing left number", () => {
let right = makeItem();
right.missingnumber = 999;
let combined = instance.combinerAdd(item, right, {
field: "missingnumber",
});
assert.deepEqual(combined.missingnumber, 999);
});
it("should add numbers", () => {
let right = makeItem();
let combined = instance.combinerAdd(item, right, { field: "lhs" });
assert.equal(combined.lhs, 4);
});
it("should error on missing left, and right is a string", () => {
let right = makeItem();
right.error = "error";
let combined = instance.combinerAdd(item, right, { field: "error" });
assert.equal(combined, null);
});
it("should error on left string", () => {
let right = makeItem();
let combined = instance.combinerAdd(item, right, { field: "foo" });
assert.equal(combined, null);
});
it("should error on mismatch types", () => {
let right = makeItem();
right.lhs = [1, 2, 3];
let combined = instance.combinerAdd(item, right, { field: "lhs" });
assert.equal(combined, null);
});
});
describe("#combinerMax", () => {
it("should do nothing when right field is missing", () => {
let right = makeItem();
let combined = instance.combinerMax(item, right, { field: "missing" });
assert.deepEqual(combined, item);
});
it("should handle missing left maps", () => {
let right = makeItem();
right.missingmap = { a: 5, b: -1, c: 3 };
let combined = instance.combinerMax(item, right, { field: "missingmap" });
assert.deepEqual(combined.missingmap, { a: 5, b: -1, c: 3 });
});
it("should handle equal sized maps", () => {
let right = makeItem();
right.map = { a: 5, b: -1, c: 3 };
let combined = instance.combinerMax(item, right, { field: "map" });
assert.deepEqual(combined.map, { a: 5, b: 2, c: 3 });
});
it("should handle short map to long map", () => {
let right = makeItem();
right.map = { a: 5, b: -1, c: 3, d: 999 };
let combined = instance.combinerMax(item, right, { field: "map" });
assert.deepEqual(combined.map, { a: 5, b: 2, c: 3, d: 999 });
});
it("should handle long map to short map", () => {
let right = makeItem();
right.map = { a: 5, b: -1, c: 3 };
item.map.d = 999;
let combined = instance.combinerMax(item, right, { field: "map" });
assert.deepEqual(combined.map, { a: 5, b: 2, c: 3, d: 999 });
});
it("should handle equal sized arrays", () => {
let right = makeItem();
right.arr1 = [5, 1, 4];
let combined = instance.combinerMax(item, right, { field: "arr1" });
assert.deepEqual(combined.arr1, [5, 3, 4]);
});
it("should handle missing left arrays", () => {
let right = makeItem();
right.missingarray = [5, 1, 4];
let combined = instance.combinerMax(item, right, {
field: "missingarray",
});
assert.deepEqual(combined.missingarray, [5, 1, 4]);
});
it("should handle short array to long array", () => {
let right = makeItem();
right.arr1 = [5, 1, 4, 7];
let combined = instance.combinerMax(item, right, { field: "arr1" });
assert.deepEqual(combined.arr1, [5, 3, 4, 7]);
});
it("should handle long array to short array", () => {
let right = makeItem();
right.arr1 = [5, 1, 4];
item.arr1.push(7);
let combined = instance.combinerMax(item, right, { field: "arr1" });
assert.deepEqual(combined.arr1, [5, 3, 4, 7]);
});
it("should handle missing left number", () => {
let right = makeItem();
right.missingnumber = 999;
let combined = instance.combinerMax(item, right, {
field: "missingnumber",
});
assert.deepEqual(combined.missingnumber, 999);
});
it("should handle big number", () => {
let right = makeItem();
right.lhs = 99;
let combined = instance.combinerMax(item, right, { field: "lhs" });
assert.equal(combined.lhs, 99);
});
it("should handle small number", () => {
let right = makeItem();
item.lhs = 99;
let combined = instance.combinerMax(item, right, { field: "lhs" });
assert.equal(combined.lhs, 99);
});
it("should error on missing left, and right is a string", () => {
let right = makeItem();
right.error = "error";
let combined = instance.combinerMax(item, right, { field: "error" });
assert.equal(combined, null);
});
it("should error on left string", () => {
let right = makeItem();
let combined = instance.combinerMax(item, right, { field: "foo" });
assert.equal(combined, null);
});
it("should error on mismatch types", () => {
let right = makeItem();
right.lhs = [1, 2, 3];
let combined = instance.combinerMax(item, right, { field: "lhs" });
assert.equal(combined, null);
});
});
describe("#combinerCollectValues", () => {
it("should error on bogus operation", () => {
let right = makeItem();
right.url_domain = "maseratiusa.com/maserati";
right.time = 41;
let combined = instance.combinerCollectValues(item, right, {
left_field: "combined_map",
right_key_field: "url_domain",
right_value_field: "time",
operation: "missing",
});
assert.equal(combined, null);
});
it("should sum when missing left", () => {
let right = makeItem();
right.url_domain = "maseratiusa.com/maserati";
right.time = 41;
let combined = instance.combinerCollectValues(item, right, {
left_field: "combined_map",
right_key_field: "url_domain",
right_value_field: "time",
operation: "sum",
});
assert.deepEqual(combined.combined_map, {
"maseratiusa.com/maserati": 41,
});
});
it("should sum when missing right", () => {
let right = makeItem();
item.combined_map = { fake: 42 };
let combined = instance.combinerCollectValues(item, right, {
left_field: "combined_map",
right_key_field: "url_domain",
right_value_field: "time",
operation: "sum",
});
assert.deepEqual(combined.combined_map, { fake: 42 });
});
it("should sum when both", () => {
let right = makeItem();
right.url_domain = "maseratiusa.com/maserati";
right.time = 41;
item.combined_map = { fake: 42, "maseratiusa.com/maserati": 41 };
let combined = instance.combinerCollectValues(item, right, {
left_field: "combined_map",
right_key_field: "url_domain",
right_value_field: "time",
operation: "sum",
});
assert.deepEqual(combined.combined_map, {
fake: 42,
"maseratiusa.com/maserati": 82,
});
});
it("should max when missing left", () => {
let right = makeItem();
right.url_domain = "maseratiusa.com/maserati";
right.time = 41;
let combined = instance.combinerCollectValues(item, right, {
left_field: "combined_map",
right_key_field: "url_domain",
right_value_field: "time",
operation: "max",
});
assert.deepEqual(combined.combined_map, {
"maseratiusa.com/maserati": 41,
});
});
it("should max when missing right", () => {
let right = makeItem();
item.combined_map = { fake: 42 };
let combined = instance.combinerCollectValues(item, right, {
left_field: "combined_map",
right_key_field: "url_domain",
right_value_field: "time",
operation: "max",
});
assert.deepEqual(combined.combined_map, { fake: 42 });
});
it("should max when both (right)", () => {
let right = makeItem();
right.url_domain = "maseratiusa.com/maserati";
right.time = 99;
item.combined_map = { fake: 42, "maseratiusa.com/maserati": 41 };
let combined = instance.combinerCollectValues(item, right, {
left_field: "combined_map",
right_key_field: "url_domain",
right_value_field: "time",
operation: "max",
});
assert.deepEqual(combined.combined_map, {
fake: 42,
"maseratiusa.com/maserati": 99,
});
});
it("should max when both (left)", () => {
let right = makeItem();
right.url_domain = "maseratiusa.com/maserati";
right.time = -99;
item.combined_map = { fake: 42, "maseratiusa.com/maserati": 41 };
let combined = instance.combinerCollectValues(item, right, {
left_field: "combined_map",
right_key_field: "url_domain",
right_value_field: "time",
operation: "max",
});
assert.deepEqual(combined.combined_map, {
fake: 42,
"maseratiusa.com/maserati": 41,
});
});
it("should overwrite when missing left", () => {
let right = makeItem();
right.url_domain = "maseratiusa.com/maserati";
right.time = 41;
let combined = instance.combinerCollectValues(item, right, {
left_field: "combined_map",
right_key_field: "url_domain",
right_value_field: "time",
operation: "overwrite",
});
assert.deepEqual(combined.combined_map, {
"maseratiusa.com/maserati": 41,
});
});
it("should overwrite when missing right", () => {
let right = makeItem();
item.combined_map = { fake: 42 };
let combined = instance.combinerCollectValues(item, right, {
left_field: "combined_map",
right_key_field: "url_domain",
right_value_field: "time",
operation: "overwrite",
});
assert.deepEqual(combined.combined_map, { fake: 42 });
});
it("should overwrite when both", () => {
let right = makeItem();
right.url_domain = "maseratiusa.com/maserati";
right.time = 41;
item.combined_map = { fake: 42, "maseratiusa.com/maserati": 77 };
let combined = instance.combinerCollectValues(item, right, {
left_field: "combined_map",
right_key_field: "url_domain",
right_value_field: "time",
operation: "overwrite",
});
assert.deepEqual(combined.combined_map, {
fake: 42,
"maseratiusa.com/maserati": 41,
});
});
it("should count when missing left", () => {
let right = makeItem();
right.url_domain = "maseratiusa.com/maserati";
right.time = 41;
let combined = instance.combinerCollectValues(item, right, {
left_field: "combined_map",
right_key_field: "url_domain",
right_value_field: "time",
operation: "count",
});
assert.deepEqual(combined.combined_map, {
"maseratiusa.com/maserati": 1,
});
});
it("should count when missing right", () => {
let right = makeItem();
item.combined_map = { fake: 42 };
let combined = instance.combinerCollectValues(item, right, {
left_field: "combined_map",
right_key_field: "url_domain",
right_value_field: "time",
operation: "count",
});
assert.deepEqual(combined.combined_map, { fake: 42 });
});
it("should count when both", () => {
let right = makeItem();
right.url_domain = "maseratiusa.com/maserati";
right.time = 41;
item.combined_map = { fake: 42, "maseratiusa.com/maserati": 1 };
let combined = instance.combinerCollectValues(item, right, {
left_field: "combined_map",
right_key_field: "url_domain",
right_value_field: "time",
operation: "count",
});
assert.deepEqual(combined.combined_map, {
fake: 42,
"maseratiusa.com/maserati": 2,
});
});
});
describe("#executeRecipe", () => {
it("should handle working steps", () => {
let final = instance.executeRecipe({}, [
{ function: "set_default", field: "foo", value: 1 },
{ function: "set_default", field: "bar", value: 10 },
]);
assert.equal(final.foo, 1);
assert.equal(final.bar, 10);
});
it("should handle unknown steps", () => {
let final = instance.executeRecipe({}, [
{ function: "set_default", field: "foo", value: 1 },
{ function: "missing" },
{ function: "set_default", field: "bar", value: 10 },
]);
assert.equal(final, null);
});
it("should handle erroring steps", () => {
let final = instance.executeRecipe({}, [
{ function: "set_default", field: "foo", value: 1 },
{
function: "accept_item_by_field_value",
field: "missing",
op: "invalid",
rhsField: "moot",
rhsValue: "m00t",
},
{ function: "set_default", field: "bar", value: 10 },
]);
assert.equal(final, null);
});
});
describe("#executeCombinerRecipe", () => {
it("should handle working steps", () => {
let final = instance.executeCombinerRecipe(
{ foo: 1, bar: 10 },
{ foo: 1, bar: 10 },
[
{ function: "combiner_add", field: "foo" },
{ function: "combiner_add", field: "bar" },
]
);
assert.equal(final.foo, 2);
assert.equal(final.bar, 20);
});
it("should handle unknown steps", () => {
let final = instance.executeCombinerRecipe(
{ foo: 1, bar: 10 },
{ foo: 1, bar: 10 },
[
{ function: "combiner_add", field: "foo" },
{ function: "missing" },
{ function: "combiner_add", field: "bar" },
]
);
assert.equal(final, null);
});
it("should handle erroring steps", () => {
let final = instance.executeCombinerRecipe(
{ foo: 1, bar: 10, baz: 0 },
{ foo: 1, bar: 10, baz: "hundred" },
[
{ function: "combiner_add", field: "foo" },
{ function: "combiner_add", field: "baz" },
{ function: "combiner_add", field: "bar" },
]
);
assert.equal(final, null);
});
});
});