| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634 |
- // Experimental
- var sklearn = sklearn || {};
- sklearn.ModelFactory = class {
- match(context) {
- const obj = context.open('pkl');
- const validate = (obj, name) => {
- if (obj && obj.__class__ && obj.__class__.__module__ && obj.__class__.__name__) {
- const key = obj.__class__.__module__ + '.' + obj.__class__.__name__;
- return key.startsWith(name);
- }
- return false;
- };
- const formats = [
- { name: 'sklearn.', format: 'sklearn' },
- { name: 'xgboost.sklearn.', format: 'sklearn' },
- { name: 'lightgbm.sklearn.', format: 'sklearn' },
- { name: 'scipy.', format: 'scipy' },
- { name: 'hmmlearn.', format: 'hmmlearn' }
- ];
- for (const format of formats) {
- if (validate(obj, format.name)) {
- return format.format;
- }
- if (Array.isArray(obj) && obj.every((item) => validate(item, format.name))) {
- return format.format + '.list';
- }
- if ((Object(obj) === obj) && Object.entries(obj).every((entry) => validate(entry[1], format.name))) {
- return format.format + '.map';
- }
- }
- return undefined;
- }
- open(context, match) {
- return context.metadata('sklearn-metadata.json').then((metadata) => {
- const obj = context.open('pkl');
- return new sklearn.Model(metadata, match, obj);
- });
- }
- };
- sklearn.Model = class {
- constructor(metadata, match, obj) {
- const formats = new Map([ [ 'sklearn', 'scikit-learn' ], [ 'scipy', 'SciPy' ], [ 'hmmlearn', 'hmmlearn' ] ]);
- this._format = formats.get(match.split('.').shift());
- this._graphs = [];
- const version = [];
- switch (match) {
- case 'sklearn':
- case 'scipy':
- case 'hmmlearn': {
- version.push(obj._sklearn_version ? ' v' + obj._sklearn_version.toString() : '');
- this._graphs.push(new sklearn.Graph(metadata, '', obj));
- break;
- }
- case 'sklearn.list':
- case 'scipy.list': {
- const list = obj;
- for (let i = 0; i < list.length; i++) {
- const obj = list[i];
- this._graphs.push(new sklearn.Graph(metadata, i.toString(), obj));
- version.push(obj._sklearn_version ? ' v' + obj._sklearn_version.toString() : '');
- }
- break;
- }
- case 'sklearn.map':
- case 'scipy.map': {
- for (const entry of Object.entries(obj)) {
- const obj = entry[1];
- this._graphs.push(new sklearn.Graph(metadata, entry[0], obj));
- version.push(obj._sklearn_version ? ' v' + obj._sklearn_version.toString() : '');
- }
- break;
- }
- default: {
- throw new sklearn.Error("Unsupported scikit-learn format '" + match + "'.");
- }
- }
- if (version.every((value) => value === version[0])) {
- this._format += version[0];
- }
- }
- get format() {
- return this._format;
- }
- get graphs() {
- return this._graphs;
- }
- };
- sklearn.Graph = class {
- constructor(metadata, name, obj) {
- this._name = name || '';
- this._metadata = metadata;
- this._nodes = [];
- this._groups = false;
- this._process('', '', obj, ['data']);
- }
- _process(group, name, obj, inputs) {
- const type = obj.__class__.__module__ + '.' + obj.__class__.__name__;
- switch (type) {
- case 'sklearn.pipeline.Pipeline': {
- this._groups = true;
- name = name || 'pipeline';
- const childGroup = this._concat(group, name);
- for (const step of obj.steps) {
- inputs = this._process(childGroup, step[0], step[1], inputs);
- }
- return inputs;
- }
- case 'sklearn.pipeline.FeatureUnion': {
- this._groups = true;
- const outputs = [];
- name = name || 'union';
- const output = this._concat(group, name);
- const subgroup = this._concat(group, name);
- this._nodes.push(new sklearn.Node(this._metadata, subgroup, output, obj, inputs, [ output ]));
- for (const transformer of obj.transformer_list){
- outputs.push(...this._process(subgroup, transformer[0], transformer[1], [ output ]));
- }
- return outputs;
- }
- case 'sklearn.compose._column_transformer.ColumnTransformer': {
- this._groups = true;
- name = name || 'transformer';
- const output = this._concat(group, name);
- const subgroup = this._concat(group, name);
- const outputs = [];
- this._nodes.push(new sklearn.Node(this._metadata, subgroup, output, obj, inputs, [ output ]));
- for (const transformer of obj.transformers){
- if (transformer[1] !== 'passthrough') {
- outputs.push(...this._process(subgroup, transformer[0], transformer[1], [ output ]));
- }
- }
- return outputs;
- }
- default: {
- const output = this._concat(group, name);
- this._nodes.push(new sklearn.Node(this._metadata, group, output, obj, inputs, output === '' ? [] : [ output ]));
- return [ output ];
- }
- }
- }
- _concat(parent, name){
- return (parent === '' ? name : `${parent}/${name}`);
- }
- get name() {
- return this._name;
- }
- get groups() {
- return this._groups;
- }
- get inputs() {
- return [];
- }
- get outputs() {
- return [];
- }
- get nodes() {
- return this._nodes;
- }
- };
- sklearn.Parameter = class {
- constructor(name, args) {
- this._name = name;
- this._arguments = args;
- }
- get name() {
- return this._name;
- }
- get visible() {
- return true;
- }
- get arguments() {
- return this._arguments;
- }
- };
- sklearn.Argument = class {
- constructor(name, type, initializer) {
- if (typeof name !== 'string') {
- throw new sklearn.Error("Invalid argument identifier '" + JSON.stringify(name) + "'.");
- }
- this._name = name;
- this._type = type || null;
- this._initializer = initializer || null;
- }
- get name() {
- return this._name;
- }
- get type() {
- if (this._initializer) {
- return this._initializer.type;
- }
- return this._type;
- }
- get initializer() {
- return this._initializer;
- }
- };
- sklearn.Node = class {
- constructor(metadata, group, name, obj, inputs, outputs) {
- this._group = group || '';
- this._name = name || '';
- const type = obj.__class__ ? obj.__class__.__module__ + '.' + obj.__class__.__name__ : 'Object';
- this._type = metadata.type(type) || { name: type };
- this._inputs = inputs.map((input) => new sklearn.Parameter(input, [ new sklearn.Argument(input, null, null) ]));
- this._outputs = outputs.map((output) => new sklearn.Parameter(output, [ new sklearn.Argument(output, null, null) ]));
- this._attributes = [];
- for (const entry of Object.entries(obj)) {
- const name = entry[0];
- const value = entry[1];
- if (value && sklearn.Utility.isTensor(value)) {
- const argument = new sklearn.Argument('', null, new sklearn.Tensor(value));
- const paramter = new sklearn.Parameter(name, [ argument ]);
- this._inputs.push(paramter);
- }
- else if (Array.isArray(value) && value.every((obj) => sklearn.Utility.isTensor(obj))) {
- const args = value.map((obj) => new sklearn.Argument('', null, new sklearn.Tensor(obj)));
- const paramter = new sklearn.Parameter(name, args);
- this._inputs.push(paramter);
- }
- else if (!name.startsWith('_')) {
- const attribute = new sklearn.Attribute(metadata.attribute(type, name), name, value);
- this._attributes.push(attribute);
- }
- }
- }
- get type() {
- return this._type; // .split('.').pop();
- }
- get name() {
- return this._name;
- }
- get group() {
- return this._group ? this._group : null;
- }
- get inputs() {
- return this._inputs;
- }
- get outputs() {
- return this._outputs;
- }
- get attributes() {
- return this._attributes;
- }
- };
- sklearn.Attribute = class {
- constructor(metadata, name, value) {
- this._name = name;
- this._value = value;
- if (metadata) {
- if (metadata.optional && this._value == null) {
- this._visible = false;
- }
- else if (metadata.visible === false) {
- this._visible = false;
- }
- else if (metadata.default !== undefined) {
- if (Array.isArray(value)) {
- if (Array.isArray(metadata.default)) {
- this._visible = value.length !== metadata.default || !this.value.every((item, index) => item == metadata.default[index]);
- }
- else {
- this._visible = !this.value.every((item) => item == metadata.default);
- }
- }
- else {
- this._visible = this.value !== metadata.default;
- }
- }
- }
- if (value) {
- if (Array.isArray(value) && value.length > 0 && value.every((obj) => obj.__class__ && obj.__class__.__module__ === value[0].__class__.__module__ && obj.__class__.__name__ === value[0].__class__.__name__)) {
- this._type = value[0].__class__.__module__ + '.' + value[0].__class__.__name__ + '[]';
- }
- else if (value.__class__) {
- this._type = value.__class__.__module__ + '.' + value.__class__.__name__;
- }
- }
- }
- get name() {
- return this._name;
- }
- get value() {
- return this._value;
- }
- get type() {
- return this._type;
- }
- get visible() {
- return this._visible == false ? false : true;
- }
- };
- sklearn.Tensor = class {
- constructor(value) {
- if (!sklearn.Utility.isTensor(value)) {
- const type = value.__class__.__module__ + '.' + value.__class__.__name__;
- throw new sklearn.Error("Unsupported tensor type '" + type + "'.");
- }
- this._type = new sklearn.TensorType(value.dtype.__name__, new sklearn.TensorShape(value.shape));
- this._data = value.data;
- if (this._type.dataType === 'string') {
- this._itemsize = value.dtype.itemsize;
- }
- }
- get type() {
- return this._type;
- }
- get kind() {
- return 'NumPy Array';
- }
- get state() {
- return this._context().state || null;
- }
- get value() {
- const context = this._context();
- if (context.state) {
- return null;
- }
- context.limit = Number.MAX_SAFE_INTEGER;
- return this._decode(context, 0);
- }
- toString() {
- const context = this._context();
- if (context.state) {
- return '';
- }
- context.limit = 10000;
- const value = this._decode(context, 0);
- switch (this._type.dataType) {
- case 'int64':
- case 'uint64':
- return sklearn.Tensor._stringify(value, '', ' ');
- default:
- break;
- }
- return JSON.stringify(value, null, 4);
- }
- _context() {
- const context = {};
- context.index = 0;
- context.count = 0;
- context.state = null;
- if (!this._type) {
- context.state = 'Tensor has no data type.';
- return context;
- }
- if (!this._data) {
- context.state = 'Tensor is data is empty.';
- return context;
- }
- context.dataType = this._type.dataType;
- context.dimensions = this._type.shape.dimensions;
- switch (context.dataType) {
- case 'float32':
- case 'float64':
- case 'uint32':
- case 'int8':
- case 'int16':
- case 'int32':
- case 'int64':
- case 'uint64':
- context.view = new DataView(this._data.buffer, this._data.byteOffset, this._data.byteLength);
- break;
- case 'string':
- context.data = this._data;
- context.itemsize = this._itemsize;
- context.decoder = new TextDecoder('utf-8');
- break;
- case 'object':
- context.data = this._data;
- break;
- default:
- context.state = "Tensor data type '" + context.dataType + "' is not implemented.";
- return context;
- }
- return context;
- }
- _decode(context, dimension) {
- const results = [];
- const size = context.dimensions[dimension];
- if (dimension == context.dimensions.length - 1) {
- for (let i = 0; i < size; i++) {
- if (context.count > context.limit) {
- results.push('...');
- return results;
- }
- switch (context.dataType) {
- case 'float32': {
- results.push(context.view.getFloat32(context.index, true));
- context.index += 4;
- context.count++;
- break;
- }
- case 'float64': {
- results.push(context.view.getFloat64(context.index, true));
- context.index += 8;
- context.count++;
- break;
- }
- case 'int8': {
- results.push(context.view.getInt8(context.index, true));
- context.index += 1;
- context.count++;
- break;
- }
- case 'int16': {
- results.push(context.view.getInt16(context.index, true));
- context.index += 2;
- context.count++;
- break;
- }
- case 'int32': {
- results.push(context.view.getInt32(context.index, true));
- context.index += 4;
- context.count++;
- break;
- }
- case 'int64': {
- results.push(context.view.getInt64(context.index, true));
- context.index += 8;
- context.count++;
- break;
- }
- case 'uint32': {
- results.push(context.view.getUint32(context.index, true));
- context.index += 4;
- context.count++;
- break;
- }
- case 'uint64': {
- results.push(context.view.getUint64(context.index, true));
- context.index += 8;
- context.count++;
- break;
- }
- case 'string': {
- const buffer = context.data.subarray(context.index, context.index + context.itemsize);
- const index = buffer.indexOf(0);
- const content = context.decoder.decode(index >= 0 ? buffer.subarray(0, index) : buffer);
- results.push(content);
- context.index += context.itemsize;
- context.count++;
- break;
- }
- case 'object': {
- results.push(context.data[context.index++]);
- context.count++;
- break;
- }
- default: {
- throw new sklearn.Error("Unsupported tensor data type '" + context.dataType + "'.");
- }
- }
- }
- }
- else {
- for (let j = 0; j < size; j++) {
- if (context.count > context.limit) {
- results.push('...');
- return results;
- }
- results.push(this._decode(context, dimension + 1));
- }
- }
- return results;
- }
- static _stringify(value, indentation, indent) {
- if (Array.isArray(value)) {
- const result = [];
- result.push('[');
- const items = value.map((item) => sklearn.Tensor._stringify(item, indentation + indent, indent));
- if (items.length > 0) {
- result.push(items.join(',\n'));
- }
- result.push(']');
- return result.join('\n');
- }
- return indentation + value.toString();
- }
- };
- sklearn.TensorType = class {
- constructor(dataType, shape) {
- this._dataType = dataType;
- this._shape = shape;
- }
- get dataType() {
- return this._dataType;
- }
- get shape() {
- return this._shape;
- }
- toString() {
- return this.dataType + this._shape.toString();
- }
- };
- sklearn.TensorShape = class {
- constructor(dimensions) {
- this._dimensions = dimensions;
- }
- get dimensions() {
- return this._dimensions;
- }
- toString() {
- return this._dimensions ? ('[' + this._dimensions.map((dimension) => dimension.toString()).join(',') + ']') : '';
- }
- };
- sklearn.Utility = class {
- static isTensor(obj) {
- return obj && obj.__class__ && obj.__class__.__module__ === 'numpy' && obj.__class__.__name__ === 'ndarray';
- }
- static findWeights(obj) {
- const keys = [ '', 'blobs' ];
- for (const key of keys) {
- const dict = key === '' ? obj : obj[key];
- if (dict) {
- const weights = new Map();
- if (dict instanceof Map) {
- for (const pair of dict) {
- if (!sklearn.Utility.isTensor(pair[1])) {
- return null;
- }
- weights.set(pair[0], pair[1]);
- }
- return weights;
- }
- else if (!Array.isArray(dict)) {
- for (const key in dict) {
- const value = dict[key];
- if (key != 'weight_order' && key != 'lr') {
- if (!key || !sklearn.Utility.isTensor(value)) {
- return null;
- }
- weights.set(key, value);
- }
- }
- return weights;
- }
- }
- }
- for (const key of keys) {
- const list = key === '' ? obj : obj[key];
- if (list && Array.isArray(list)) {
- const weights = new Map();
- for (let i = 0; i < list.length; i++) {
- const value = list[i];
- if (!sklearn.Utility.isTensor(value, 'numpy.ndarray')) {
- return null;
- }
- weights.set(i.toString(), value);
- }
- return weights;
- }
- }
- return null;
- }
- };
- sklearn.Error = class extends Error {
- constructor(message) {
- super(message);
- this.name = 'Error loading scikit-learn model.';
- }
- };
- if (typeof module !== 'undefined' && typeof module.exports === 'object') {
- module.exports.ModelFactory = sklearn.ModelFactory;
- }
|