// colab link: [...] function MnistRNN() { var model = this; this.weights_meta = { '(MnistNet).dropout(Dropout).keygen(Generator)._key': [[1973249, 1973251], [2]], '(MnistNet).lstm_core(LSTMCore).fc(Linear).b': [[266496, 268544], [2048]], '(MnistNet).lstm_core(LSTMCore).fc(Linear).w': [[268544, 1841408], [768, 2048]], '(MnistNet).output_head(Linear).b': [[1841408, 1841665], [257]], '(MnistNet).output_head(Linear).w': [[1841665, 1973249], [512, 257]], '(MnistNet).pos_embed(Embed).embeddings': [[0, 200704], [784, 256]], '(MnistNet).value_embed(Embed).embeddings': [[200704, 266496], [257, 256]] }; this.is_model_ready = false; this.embed_lookup = function(index, weights) { return tf.slice(weights, [index], [1]); }; this.pos = 0; this.state = null; this.start_token = 256; this.hidden_size = this.weights_meta['(MnistNet).lstm_core(LSTMCore).fc(Linear).b'][1][0] / 4; this.initialize_state = function() { this.pos = 0; this.token = this.start_token; var hidden = tf.zeros([1, this.hidden_size]); var cell = tf.zeros([1, this.hidden_size]); this.state = [hidden, cell]; }; this.lstm_core = function(inputs, state, weights) { const [hidden, cell] = state; const [w, b] = weights; const i_and_h =tf.concat([inputs, hidden], 1); const gated = tf.add(tf.matMul(i_and_h, w), b); const [i, g, f, o] = tf.split(gated, 4, 1); const f_ = tf.sigmoid(tf.add(f, 1.)); const i_ = tf.sigmoid(i); const g_ = tf.tanh(g); const c = tf.add( tf.mul(i_, g_), tf.mul(cell, f_) ); const h = tf.mul( tf.sigmoid(o), tf.tanh(c) ); return [h, c]; }; this.step = function() { const [token, h, c] = tf.tidy( function() { const lstm_b = model.MODEL_WEIGHTS['(MnistNet).lstm_core(LSTMCore).fc(Linear).b']; const lstm_w = model.MODEL_WEIGHTS['(MnistNet).lstm_core(LSTMCore).fc(Linear).w']; const output_b = model.MODEL_WEIGHTS['(MnistNet).output_head(Linear).b']; const output_w = model.MODEL_WEIGHTS['(MnistNet).output_head(Linear).w']; const pos_embed = model.MODEL_WEIGHTS['(MnistNet).pos_embed(Embed).embeddings']; const value_embed = model.MODEL_WEIGHTS['(MnistNet).value_embed(Embed).embeddings']; const v = model.embed_lookup(model.token, value_embed); const p = model.embed_lookup(model.pos, pos_embed); const x = tf.add(v, p); const [h, c] = model.lstm_core(x, model.state, [lstm_w, lstm_b]); tf.dispose(model.state[0]); tf.dispose(model.state[1]); const logits = tf.add( tf.matMul(h, output_w), output_b ); const token = tf.multinomial(logits, 1).dataSync()[0]; return [token, h, c]; }); this.clean_memory(); this.token = token; this.state = [h, c]; canvas.plot_xyc(this.pos, token); this.pos = this.pos + 1; }; this.MODEL_WEIGHTS = {}; this.clean_memory = function() { tf.dispose(model.state[0]); tf.dispose(model.state[1]); }; this.loop = function() { this.step(); if (this.pos >=28*28) { setTimeout(function(){ model.clean_memory(); model.initialize_state(); canvas.plot_grid(); model.loop(); }, 3000); } else { canvas.plot_xyc(this.pos, 255); setTimeout(function(){model.loop();}, 0); } }; this.load_model_weights = function() { var req = new XMLHttpRequest(); req.open("GET", "weights.bin", true); console.log('loading weights...'); req.responseType = "arraybuffer"; var this_ = this; req.onload = function (event) { var buff = req.response; if (buff) { var W = new Float32Array(buff); for(var k in this_.weights_meta) { info = this_.weights_meta[k]; offset = info[0]; shape = info[1]; this_.MODEL_WEIGHTS[k] = tf.tensor(W.subarray(offset[0], offset[1]), shape); } this_.is_model_ready = true; } else { alert('Error while loading weights...'); } }; req.send(null); }; this.load_when_ready = function() { tf.ready().then( function() { tf.enableProdMode(); console.log('tf is ready'); model.initialize_state() model.load_model_weights(); console.log(model.hidden_size); }); }; } function MnistCanvas() { var canvas = document.getElementById("mnist-canvas"); canvas.width = window.innerWidth; canvas.height = window.innerHeight; context=canvas.getContext('2d'); context.translate(canvas.width/2,canvas.height/2); var scale = Math.floor(Math.min(canvas.width, canvas.height) / (28*2) ) * 28; console.log(scale); context.scale(scale, scale) context.imageSmoothingEnabled = false; this.clear = function() { context.clearRect(-1, -1, 2., 2.); context.fillStyle = "rgb(0, 0, 0)"; context.fillRect(-10, -10, 20, 20); }; this.plot_grid = function() { for (var i=0; i< 28*28; i++) this.plot_xyc(i, 0); }; this.plot_xyc = function (pos, color) { color = Math.max(20, color); var step = 1. / 28; var y = Math.floor(pos / 28 - 14) * step; var x = (pos % 28 - 14) * step; context.fillStyle = "rgb(0, " + color + ", 0)"; context.fillRect(x, y, step, step); context.strokeStyle = "rgb(0, 0, 0)"; context.lineWidth = 0.008; context.strokeRect(x, y, step, step); }; this.loading_animation = function() { var counter = 0; var this_ = this; this_.plot_grid(); var draw = function() { if (model.is_model_ready) { console.log('stopping animation.'); model.loop(); return; } if (counter >= 28*28) { this_.plot_grid(); counter = 0; } this_.plot_xyc(counter, 255); if (counter < 28*28-1) { this_.plot_xyc(counter+1, 255); } counter = counter+1; window.requestAnimationFrame(draw); }; window.requestAnimationFrame(draw); }; } var model = null; var canvas = null; window.onload = function() { setTimeout(function() { model = new MnistRNN(); canvas = new MnistCanvas(); console.log("init..."); canvas.clear(); canvas.loading_animation(); model.load_when_ready(); }, 500); };