UNPKG

@tensorflow/tfjs-layers

Version:

TensorFlow layers API in JavaScript

103 lines 13.2 kB
/**
 * @license
 * Copyright 2023 Google LLC.
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 * =============================================================================
 */
/**
 * Position embedding implementation based on `tf.layers.Layer`.
 */
/* Original source: keras_nlp/layers/modeling/position_embedding.py */
import { serialization, tidy } from '@tensorflow/tfjs-core';
import { Layer } from '../../../engine/topology';
import { ValueError } from '../../../errors';
import { getInitializer, serializeInitializer } from '../../../initializers';
import { getExactlyOneTensor } from '../../../utils/types_utils';
/**
 * A layer which learns a position embedding for input sequences.
 *
 * This class assumes that in the input tensor, the last dimension corresponds
 * to the features, and the dimension before the last corresponds to the
 * sequence.
 *
 * Examples:
 *
 * Called directly on input.
 * ```js
 * const layer = new PositionEmbedding({sequenceLength: 10});
 * layer.call(tf.zeros([8, 10, 16]));
 * ```
 *
 * Combine with a token embedding.
 * ```js
 * const seqLength = 50;
 * const vocabSize = 5000;
 * const embedDim = 128;
 * const inputs = tf.input({shape: [seqLength]});
 * const tokenEmbeddings = tf.layers.embedding({
 *     inputDim: vocabSize, outputDim: embedDim
 * }).apply(inputs);
 * const positionEmbeddings = new PositionEmbedding({
 *     sequenceLength: seqLength
 * }).apply(tokenEmbeddings);
 * const outputs = tf.add(tokenEmbeddings, positionEmbeddings);
 * ```
 *
 * Reference:
 *  - [Devlin et al., 2019](https://arxiv.org/abs/1810.04805)
 */
class PositionEmbedding extends Layer {
    /**
     * @param args Layer arguments. `sequenceLength` is required; `initializer`
     *     is optional and falls back to `'glorotUniform'` when falsy. The
     *     whole object is also forwarded to the `Layer` constructor.
     * @throws ValueError if `args.sequenceLength` is `null` or `undefined`.
     */
    constructor(args) {
        super(args);
        // Loose `== null` deliberately rejects both `null` and `undefined`.
        if (args.sequenceLength == null) {
            throw new ValueError('`sequenceLength` must be an Integer, received `null`.');
        }
        this.sequenceLength = args.sequenceLength;
        this.initializer = getInitializer(args.initializer || 'glorotUniform');
    }
    /**
     * Returns the serializable configuration of this layer: its
     * `sequenceLength`, its serialized `initializer`, and every entry of the
     * base-class config.
     *
     * @returns The merged config object.
     */
    getConfig() {
        const config = {
            'sequenceLength': this.sequenceLength,
            'initializer': serializeInitializer(this.initializer),
        };
        const baseConfig = super.getConfig();
        // Base-class entries are copied last, so they win on a key collision.
        Object.assign(config, baseConfig);
        return config;
    }
    /**
     * Creates the `embeddings` weight with shape
     * `[sequenceLength, featureSize]`, where `featureSize` is the last entry
     * of `inputShape`.
     *
     * @param inputShape Shape of the input; only its last entry is read here.
     */
    build(inputShape) {
        const featureSize = inputShape[inputShape.length - 1];
        // Positional arguments after the shape follow `Layer.addWeight`:
        // dtype, initializer, regularizer, trainable.
        this.positionEmbeddings = this.addWeight('embeddings', [this.sequenceLength, featureSize], null, this.initializer, null, true);
        super.build(inputShape);
    }
    /**
     * Returns the position embeddings for `inputs`, broadcast to the shape of
     * `inputs`.
     *
     * @param inputs A tensor, or a container from which `getExactlyOneTensor`
     *     extracts exactly one tensor. Only its shape is used.
     * @param kwargs Optional call options. `kwargs.startIndex` is the row of
     *     the embedding table at which to start reading; it defaults to `0`
     *     when `kwargs` or `kwargs.startIndex` is `null`/`undefined`. The
     *     `kwargs` object is not modified.
     * @returns A tensor with the same shape as the input.
     */
    call(inputs, kwargs) {
        return tidy(() => {
            // `kwargs` is optional: tolerate a direct `layer.call(x)` and read
            // the option into a local rather than writing the default back
            // into the caller's object.
            const startIndex = kwargs != null && kwargs.startIndex != null ?
                kwargs.startIndex :
                0;
            const shape = getExactlyOneTensor(inputs).shape;
            const featureLength = shape[shape.length - 1];
            const sequenceLength = shape[shape.length - 2];
            // trim to match the length of the input sequence, which might be less
            // than the sequence_length of the layer.
            const positionEmbeddings = this.positionEmbeddings.read().slice([startIndex, 0], [sequenceLength, featureLength]);
            return positionEmbeddings.broadcastTo(shape);
        });
    }
    /**
     * The output has the same shape as the input.
     *
     * @param inputShape Shape of the input.
     * @returns `inputShape`, unchanged.
     */
    computeOutputShape(inputShape) {
        return inputShape;
    }
}
/** @nocollapse */
PositionEmbedding.className = 'PositionEmbedding';
export { PositionEmbedding };
serialization.registerClass(PositionEmbedding);
//# sourceMappingURL=data:application/json;base64,