| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461 |
// Experimental

// Shared namespace object; an already-declared `sklearn` is reused rather than replaced.
var sklearn = sklearn || {};

/**
 * Recognizes unpickled objects by the module path of their Python class and
 * opens them as sklearn.Model instances.
 */
sklearn.ModelFactory = class {

    /**
     * Classifies the object returned by `context.open('pkl')`.
     *
     * For each known module prefix, in table order, the root object is tested
     * directly, then as a non-empty array whose items all match, then as an
     * object whose own enumerable values all match.
     *
     * @param {object} context - Must provide `open('pkl')`.
     * @returns {?string} The format id, optionally suffixed with '.list' or
     * '.map', or null when nothing matches.
     */
    match(context) {
        const root = context.open('pkl');
        // [ module prefix, format id ] pairs; the table order is the matching priority.
        const families = [
            [ 'sklearn.', 'sklearn' ],
            [ 'xgboost.sklearn.', 'sklearn' ],
            [ 'lightgbm.sklearn.', 'sklearn' ],
            [ 'scipy.', 'scipy' ],
            [ 'hmmlearn.', 'hmmlearn' ]
        ];
        // True when the candidate carries a `__class__` whose qualified name starts with prefix.
        const belongsTo = (candidate, prefix) => {
            const type = candidate && candidate.__class__;
            if (!type || !type.__module__ || !type.__name__) {
                return false;
            }
            return `${type.__module__}.${type.__name__}`.startsWith(prefix);
        };
        for (const [ prefix, format ] of families) {
            if (belongsTo(root, prefix)) {
                return format;
            }
            if (Array.isArray(root) && root.length > 0 && root.every((item) => belongsTo(item, prefix))) {
                return `${format}.list`;
            }
            if (Object(root) === root) {
                const members = Object.values(root);
                if (members.length > 0 && members.every((member) => belongsTo(member, prefix))) {
                    return `${format}.map`;
                }
            }
        }
        return null;
    }

    /**
     * Builds the model for a target previously returned by match().
     *
     * @param {object} context - Must provide `metadata(name)` and `open('pkl')`.
     * @param {string} target - Format id returned by match().
     * @returns {Promise<sklearn.Model>} The constructed model.
     */
    async open(context, target) {
        // The metadata is awaited before the pickle object is requested.
        const metadata = await context.metadata('sklearn-metadata.json');
        const root = context.open('pkl');
        return new sklearn.Model(metadata, target, root);
    }
};
/**
 * A model made of one graph per unpickled root object.
 */
sklearn.Model = class {

    /**
     * @param {object} metadata - Metadata object handed through to every sklearn.Graph.
     * @param {string} target - Format id: a family ('sklearn', 'scipy' or 'hmmlearn'),
     * optionally followed by '.list' or '.map'.
     * @param {object|Array} obj - The root object, an array of them ('.list'),
     * or an object whose own enumerable values are root objects ('.map').
     * @throws {sklearn.Error} When the family or the container suffix is not supported.
     */
    constructor(metadata, target, obj) {
        const names = new Map([ [ 'sklearn', 'scikit-learn' ], [ 'scipy', 'SciPy' ], [ 'hmmlearn', 'hmmlearn' ] ]);
        const separator = target.indexOf('.');
        const family = separator === -1 ? target : target.substring(0, separator);
        const layout = separator === -1 ? '' : target.substring(separator + 1);
        if (!names.has(family)) {
            throw new sklearn.Error("Unsupported scikit-learn format '" + target + "'.");
        }
        // Normalize every layout to [ graph name, root object ] pairs. Family and
        // layout are handled independently so each family supports each layout
        // (the earlier switch omitted 'hmmlearn.list' and 'hmmlearn.map').
        const items = [];
        switch (layout) {
            case '': {
                items.push([ '', obj ]);
                break;
            }
            case 'list': {
                for (let i = 0; i < obj.length; i++) {
                    items.push([ i.toString(), obj[i] ]);
                }
                break;
            }
            case 'map': {
                items.push(...Object.entries(obj));
                break;
            }
            default: {
                throw new sklearn.Error("Unsupported scikit-learn format '" + target + "'.");
            }
        }
        this._format = names.get(family);
        this._graphs = [];
        const versions = [];
        for (const [ name, item ] of items) {
            this._graphs.push(new sklearn.Graph(metadata, name, item));
            if (item._sklearn_version) {
                versions.push(` v${item._sklearn_version.toString()}`);
            }
        }
        // The version suffix is appended only when every reported version agrees.
        if (versions.length > 0 && versions.every((version) => version === versions[0])) {
            this._format += versions[0];
        }
    }

    /** @returns {string} Display name of the format, with a version suffix when one was found. */
    get format() {
        return this._format;
    }

    /** @returns {sklearn.Graph[]} One graph per root object. */
    get graphs() {
        return this._graphs;
    }
};
/**
 * A graph built from one unpickled estimator. Pipelines, feature unions and
 * column transformers are expanded into their nested estimators.
 */
sklearn.Graph = class {

    /**
     * @param {object} metadata - Metadata object handed through to every sklearn.Node.
     * @param {string} name - Graph name; a falsy value becomes ''.
     * @param {object} obj - Root object; must carry `__class__.__module__` and `__class__.__name__`.
     */
    constructor(metadata, name, obj) {
        this._name = name || '';
        this._metadata = metadata;
        this._nodes = [];
        this._groups = false;
        // One sklearn.Value per identifier, so nodes naming the same identifier share the instance.
        const values = new Map();
        const value = (identifier) => {
            if (!values.has(identifier)) {
                values.set(identifier, new sklearn.Value(identifier, null, null));
            }
            return values.get(identifier);
        };
        const concat = (parent, child) => (parent === '' ? child : `${parent}/${child}`);
        // Composite estimators may hold a string (the original code already
        // special-cased 'passthrough') or null in place of an estimator. Such
        // entries have no `__class__` and cannot become nodes, so they are skipped.
        const isPlaceholder = (estimator) => estimator === null || estimator === undefined || typeof estimator === 'string';
        // Emits a node for a composite estimator, then feeds that node's output
        // to every child; returns the concatenated child outputs.
        const fanOut = (group, name, composite, inputs, children) => {
            this._groups = true;
            const path = concat(group, name);
            this._nodes.push(new sklearn.Node(this._metadata, path, path, composite, inputs, [ path ], value));
            const outputs = [];
            for (const child of children) {
                if (!isPlaceholder(child[1])) {
                    outputs.push(...process(path, child[0], child[1], [ path ]));
                }
            }
            return outputs;
        };
        // Adds the node(s) for `estimator` under `group` and returns the output identifiers.
        const process = (group, name, estimator, inputs) => {
            const type = `${estimator.__class__.__module__}.${estimator.__class__.__name__}`;
            switch (type) {
                case 'sklearn.pipeline.Pipeline': {
                    this._groups = true;
                    const path = concat(group, name || 'pipeline');
                    let current = inputs;
                    for (const step of estimator.steps) {
                        // A placeholder step leaves the running inputs unchanged.
                        if (!isPlaceholder(step[1])) {
                            current = process(path, step[0], step[1], current);
                        }
                    }
                    return current;
                }
                case 'sklearn.pipeline.FeatureUnion': {
                    return fanOut(group, name || 'union', estimator, inputs, estimator.transformer_list);
                }
                case 'sklearn.compose._column_transformer.ColumnTransformer': {
                    return fanOut(group, name || 'transformer', estimator, inputs, estimator.transformers);
                }
                default: {
                    const output = concat(group, name);
                    // An unnamed top-level estimator gets no output argument.
                    this._nodes.push(new sklearn.Node(this._metadata, group, output, estimator, inputs, output === '' ? [] : [ output ], value));
                    return [ output ];
                }
            }
        };
        process('', '', obj, [ 'data' ]);
    }

    /** @returns {string} The graph name. */
    get name() {
        return this._name;
    }

    /** @returns {boolean} True when a composite estimator was expanded. */
    get groups() {
        return this._groups;
    }

    /** @returns {Array} Always empty. */
    get inputs() {
        return [];
    }

    /** @returns {Array} Always empty. */
    get outputs() {
        return [];
    }

    /** @returns {sklearn.Node[]} Nodes in creation order. */
    get nodes() {
        return this._nodes;
    }
};
/**
 * A named node input or output holding the value(s) bound to it.
 */
sklearn.Argument = class {

    /**
     * @param {string} name - Argument name.
     * @param {Array} value - Values bound to the argument; stored as given.
     */
    constructor(name, value) {
        this._name = name;
        this._value = value;
    }

    /** @returns {string} The argument name. */
    get name() {
        return this._name;
    }

    /** @returns {Array} The values passed to the constructor. */
    get value() {
        return this._value;
    }
};
/**
 * A value identified by name, optionally backed by an initializer.
 */
sklearn.Value = class {

    /**
     * @param {string} name - Value identifier.
     * @param {?object} type - Declared type; falsy values are stored as null.
     * @param {?object} initializer - Initializer; falsy values are stored as null.
     * @throws {sklearn.Error} When name is not a string.
     */
    constructor(name, type, initializer) {
        if (typeof name !== 'string') {
            throw new sklearn.Error(`Invalid value identifier '${JSON.stringify(name)}'.`);
        }
        this._name = name;
        this._type = type ? type : null;
        this._initializer = initializer ? initializer : null;
    }

    /** @returns {string} The value identifier. */
    get name() {
        return this._name;
    }

    /** @returns {?object} The initializer's type when an initializer is set, otherwise the declared type. */
    get type() {
        return this._initializer ? this._initializer.type : this._type;
    }

    /** @returns {?object} The initializer, or null. */
    get initializer() {
        return this._initializer;
    }
};
/**
 * A graph node for one unpickled object. Members holding numpy arrays become
 * extra inputs; the remaining public members become attributes.
 */
sklearn.Node = class {

    /**
     * @param {object} metadata - Must provide `type(name)` and `attribute(type, name)`.
     * @param {string} group - Group path; a falsy value becomes ''.
     * @param {string} name - Node name; a falsy value becomes ''.
     * @param {object} obj - Object whose own enumerable members are inspected.
     * @param {string[]} inputs - Identifiers of the incoming values.
     * @param {string[]} outputs - Identifiers of the produced values.
     * @param {function(string): sklearn.Value} value - Resolves an identifier to its value.
     */
    constructor(metadata, group, name, obj, inputs, outputs, value) {
        this._group = group || '';
        this._name = name || '';
        const type = obj.__class__ ? `${obj.__class__.__module__}.${obj.__class__.__name__}` : 'Object';
        this._type = metadata.type(type) || { name: type };
        this._inputs = inputs.map((input) => new sklearn.Argument(input, [ value(input) ]));
        this._outputs = outputs.map((output) => new sklearn.Argument(output, [ value(output) ]));
        this._attributes = [];
        const initializer = (array) => new sklearn.Value('', null, new sklearn.Tensor(array));
        for (const [ key, member ] of Object.entries(obj)) {
            if (sklearn.Utility.isTensor(member)) {
                this._inputs.push(new sklearn.Argument(key, [ initializer(member) ]));
            } else if (Array.isArray(member) && member.length > 0 && member.every((item) => sklearn.Utility.isTensor(item))) {
                // The length check matters: every() is vacuously true for [], which
                // would turn an empty list into an input with no values instead of
                // leaving it as an attribute.
                this._inputs.push(new sklearn.Argument(key, member.map((item) => initializer(item))));
            } else if (!key.startsWith('_')) {
                this._attributes.push(new sklearn.Attribute(metadata.attribute(type, key), key, member));
            }
        }
    }

    /** @returns {object} The result of `metadata.type(...)`, or `{ name }` when that is falsy. */
    get type() {
        return this._type;
    }

    /** @returns {string} The node name. */
    get name() {
        return this._name;
    }

    /** @returns {?string} The group path, or null when it is empty. */
    get group() {
        return this._group ? this._group : null;
    }

    /** @returns {sklearn.Argument[]} Incoming values followed by tensor members. */
    get inputs() {
        return this._inputs;
    }

    /** @returns {sklearn.Argument[]} The produced values. */
    get outputs() {
        return this._outputs;
    }

    /** @returns {sklearn.Attribute[]} Non-tensor members whose name does not start with '_'. */
    get attributes() {
        return this._attributes;
    }
};
/**
 * A node attribute with a visibility flag derived from metadata and a type
 * name derived from the value's `__class__`.
 */
sklearn.Attribute = class {

    /**
     * @param {?object} metadata - Optional schema; the fields read are
     * `optional`, `visible` and `default`.
     * @param {string} name - Attribute name.
     * @param {*} value - Attribute value.
     */
    constructor(metadata, name, value) {
        this._name = name;
        this._value = value;
        if (metadata) {
            if (metadata.optional && value == null) {
                this._visible = false;
            } else if (metadata.visible === false) {
                this._visible = false;
            } else if (metadata.default !== undefined) {
                const expected = metadata.default;
                if (Array.isArray(value)) {
                    if (Array.isArray(expected)) {
                        // Compare against the default's length; comparing the length
                        // to the array itself is always unequal and kept every
                        // default-valued array attribute visible.
                        // Element comparison keeps the original loose equality.
                        this._visible = value.length !== expected.length || !value.every((item, index) => item == expected[index]);
                    } else {
                        // A scalar default matches when every element loosely equals it.
                        this._visible = !value.every((item) => item == expected);
                    }
                } else {
                    this._visible = value !== expected;
                }
            }
        }
        if (value) {
            // `item &&` guards null/undefined elements, which would otherwise throw
            // on the `__class__` access.
            const first = Array.isArray(value) && value.length > 0 ? value[0] : null;
            const uniform = first !== null && value.every((item) => item && item.__class__ &&
                item.__class__.__module__ === first.__class__.__module__ &&
                item.__class__.__name__ === first.__class__.__name__);
            if (uniform) {
                this._type = `${first.__class__.__module__}.${first.__class__.__name__}[]`;
            } else if (value.__class__) {
                this._type = `${value.__class__.__module__}.${value.__class__.__name__}`;
            }
        }
    }

    /** @returns {string} The attribute name. */
    get name() {
        return this._name;
    }

    /** @returns {*} The attribute value. */
    get value() {
        return this._value;
    }

    /** @returns {string|undefined} Qualified class name ('[]'-suffixed for uniform arrays), when derivable. */
    get type() {
        return this._type;
    }

    /** @returns {boolean} False only when the metadata rules hid the attribute. */
    get visible() {
        return this._visible !== false;
    }
};
/**
 * Tensor view over an unpickled numpy ndarray.
 */
sklearn.Tensor = class {

    /**
     * @param {object} array - Object accepted by sklearn.Utility.isTensor; its
     * `dtype`, `shape`, `tolist()` and `tobytes()` members are used.
     * @throws {sklearn.Error} When array is not recognized as a tensor.
     */
    constructor(array) {
        if (!sklearn.Utility.isTensor(array)) {
            // The rejected input may be null or lack `__class__`; build the
            // message defensively so the intended sklearn.Error is raised
            // rather than a TypeError from the message construction itself.
            const cls = array ? array.__class__ : null;
            const type = cls ? `${cls.__module__}.${cls.__name__}` : typeof array;
            throw new sklearn.Error("Unsupported tensor type '" + type + "'.");
        }
        this._type = new sklearn.TensorType(array.dtype.__name__, new sklearn.TensorShape(array.shape));
        this._byteorder = array.dtype.byteorder;
        // 'string' and 'object' arrays are kept as lists, everything else as bytes.
        const dataType = this._type.dataType;
        this._data = dataType === 'string' || dataType === 'object' ? array.tolist() : array.tobytes();
    }

    /** @returns {sklearn.TensorType} Data type and shape. */
    get type() {
        return this._type;
    }

    /** @returns {string} Always 'NumPy Array'. */
    get category() {
        return 'NumPy Array';
    }

    /** @returns {string} '|' for 'string' and 'object' data, otherwise the dtype's byteorder. */
    get layout() {
        const dataType = this._type.dataType;
        return dataType === 'string' || dataType === 'object' ? '|' : this._byteorder;
    }

    /** @returns {*} The result of `tolist()` or `tobytes()` captured at construction. */
    get values() {
        return this._data;
    }
};
/**
 * Pairs an element data type name with a tensor shape.
 */
sklearn.TensorType = class {

    /**
     * @param {string} dataType - Element type name.
     * @param {sklearn.TensorShape} shape - Shape object; its toString() is used for display.
     */
    constructor(dataType, shape) {
        this._dataType = dataType;
        this._shape = shape;
    }

    /** @returns {string} The element type name. */
    get dataType() {
        return this._dataType;
    }

    /** @returns {sklearn.TensorShape} The shape. */
    get shape() {
        return this._shape;
    }

    /** @returns {string} The data type name immediately followed by the shape text. */
    toString() {
        const suffix = this._shape.toString();
        return this.dataType + suffix;
    }
};
/**
 * Holds the list of tensor dimensions.
 */
sklearn.TensorShape = class {

    /**
     * @param {?Array} dimensions - Dimension list; may be falsy.
     */
    constructor(dimensions) {
        this._dimensions = dimensions;
    }

    /** @returns {?Array} The dimensions passed to the constructor. */
    get dimensions() {
        return this._dimensions;
    }

    /** @returns {string} '[d0,d1,...]', or '' when no dimension list is set. */
    toString() {
        if (!this._dimensions) {
            return '';
        }
        const parts = this._dimensions.map((dimension) => dimension.toString());
        return `[${parts.join(',')}]`;
    }
};
/**
 * Helpers for recognizing numpy arrays in unpickled data.
 */
sklearn.Utility = class {

    /**
     * Tests whether obj is tagged as `numpy.ndarray` through its `__class__`.
     *
     * @param {*} obj - Candidate value.
     * @returns {*} A truthy value for an ndarray; otherwise a falsy value
     * (which may be obj itself when obj is falsy).
     */
    static isTensor(obj) {
        return obj && obj.__class__ && obj.__class__.__module__ === 'numpy' && obj.__class__.__name__ === 'ndarray';
    }

    /**
     * Collects named tensors from obj or from `obj.blobs`.
     *
     * Candidates are tried in order: obj as a dictionary (Map or plain object),
     * `obj.blobs` as a dictionary, obj as an array, `obj.blobs` as an array.
     * The first candidate consisting solely of tensors wins. A candidate that
     * does not qualify no longer aborts the search: the earlier early-return
     * left the `blobs` candidates effectively unreachable.
     *
     * @param {*} obj - Container to inspect; null and undefined yield null.
     * @returns {?Map} Tensors keyed by name (array indices become decimal
     * strings), or null when no candidate qualifies.
     */
    static findWeights(obj) {
        if (obj === null || obj === undefined) {
            return null;
        }
        const candidates = [ obj, obj.blobs ];
        // Reads a Map or a non-array value as name -> tensor; null on any non-tensor entry.
        const fromDictionary = (dict) => {
            const weights = new Map();
            if (dict instanceof Map) {
                for (const [ name, tensor ] of dict) {
                    if (!sklearn.Utility.isTensor(tensor)) {
                        return null;
                    }
                    weights.set(name, tensor);
                }
                return weights;
            }
            for (const name in dict) {
                // 'weight_order' and 'lr' entries are ignored, not treated as weights.
                if (name === 'weight_order' || name === 'lr') {
                    continue;
                }
                const tensor = dict[name];
                if (!name || !sklearn.Utility.isTensor(tensor)) {
                    return null;
                }
                weights.set(name, tensor);
            }
            return weights;
        };
        // Reads an array as index -> tensor; null on any non-tensor element.
        const fromList = (list) => {
            const weights = new Map();
            for (let i = 0; i < list.length; i++) {
                if (!sklearn.Utility.isTensor(list[i])) {
                    return null;
                }
                weights.set(i.toString(), list[i]);
            }
            return weights;
        };
        for (const candidate of candidates) {
            if (candidate && !Array.isArray(candidate)) {
                const weights = fromDictionary(candidate);
                if (weights) {
                    return weights;
                }
            }
        }
        for (const candidate of candidates) {
            if (Array.isArray(candidate)) {
                const weights = fromList(candidate);
                if (weights) {
                    return weights;
                }
            }
        }
        return null;
    }
};
/**
 * Error type raised by the loader; `name` is set to a fixed descriptive label.
 */
sklearn.Error = class extends Error {

    /**
     * @param {string} message - Description of the failure.
     */
    constructor(message) {
        super(message);
        this.name = 'Error loading scikit-learn model.';
    }
};
// Publish the factory through CommonJS only when a `module.exports` object is
// present; otherwise nothing is exported here.
if (typeof module !== 'undefined' && typeof module.exports === 'object') {
    module.exports.ModelFactory = sklearn.ModelFactory;
}
|