@tensorflow/tfjs-layers
Version:
TensorFlow layers API in JavaScript
103 lines • 13.2 kB
JavaScript
/**
* @license
* Copyright 2023 Google LLC.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
* =============================================================================
*/
/**
* Position embedding implementation based on `tf.layers.Layer`.
*/
/* Original source: keras_nlp/layers/modeling/position_embedding.py */
import { serialization, tidy } from '@tensorflow/tfjs-core';
import { Layer } from '../../../engine/topology';
import { ValueError } from '../../../errors';
import { getInitializer, serializeInitializer } from '../../../initializers';
import { getExactlyOneTensor } from '../../../utils/types_utils';
/**
* A layer which learns a position embedding for input sequences.
*
* This class assumes that in the input tensor, the last dimension corresponds
* to the features, and the dimension before the last corresponds to the
* sequence.
*
* Examples:
*
* Called directly on input.
* ```js
* const layer = new PositionEmbedding({sequenceLength: 10});
* layer.apply(tf.zeros([8, 10, 16]));
* ```
*
* Combine with a token embedding.
* ```js
* const seqLength = 50;
* const vocabSize = 5000;
* const embedDim = 128;
* const inputs = tf.input({shape: [seqLength]});
* const tokenEmbeddings = tf.layers.embedding({
* inputDim: vocabSize, outputDim: embedDim
* }).apply(inputs);
* const positionEmbeddings = new PositionEmbedding({
* sequenceLength: seqLength
* }).apply(tokenEmbeddings);
* const outputs = tf.add(tokenEmbeddings, positionEmbeddings);
* ```
*
* Reference:
* - [Devlin et al., 2019](https://arxiv.org/abs/1810.04805)
*/
class PositionEmbedding extends Layer {
  /**
   * @param args Layer configuration. `sequenceLength` is required;
   *     `initializer` is optional and falls back to `'glorotUniform'`.
   *     The whole object is also forwarded to the base `Layer` constructor.
   * @throws {ValueError} If `args` or `args.sequenceLength` is null/undefined.
   */
  constructor(args) {
    super(args);
    // Guard `args` itself as well, so a missing config object surfaces as the
    // intended ValueError rather than a TypeError on property access.
    if (args == null || args.sequenceLength == null) {
      throw new ValueError('`sequenceLength` must be an Integer, received `null`.');
    }
    this.sequenceLength = args.sequenceLength;
    this.initializer = getInitializer(args.initializer || 'glorotUniform');
  }

  /**
   * Returns this layer's configuration: `sequenceLength` and the serialized
   * initializer, merged with the base layer config (base entries win on
   * key collisions because they are assigned last).
   */
  getConfig() {
    const config = {
      'sequenceLength': this.sequenceLength,
      'initializer': serializeInitializer(this.initializer),
    };
    const baseConfig = super.getConfig();
    Object.assign(config, baseConfig);
    return config;
  }

  /**
   * Creates the `embeddings` weight of shape `[sequenceLength, featureSize]`,
   * where `featureSize` is the last entry of `inputShape`.
   *
   * @param inputShape Shape of the input; only its last entry is read here.
   */
  build(inputShape) {
    const featureSize = inputShape[inputShape.length - 1];
    // NOTE(review): the trailing `true` is presumably the `trainable` flag of
    // `addWeight` -- confirm against the base Layer API.
    this.positionEmbeddings = this.addWeight(
        'embeddings', [this.sequenceLength, featureSize], null,
        this.initializer, null, true);
    super.build(inputShape);
  }

  /**
   * Slices the position embedding table to the input's sequence length and
   * broadcasts the result to the full input shape.
   *
   * @param inputs A tensor (or whatever `getExactlyOneTensor` accepts) whose
   *     last dimension is the feature size and second-to-last the sequence
   *     length.
   * @param kwargs Optional. `kwargs.startIndex` is the row of the embedding
   *     table at which the slice starts; defaults to 0 when `kwargs` or
   *     `startIndex` is null/undefined. `kwargs` is never modified.
   * @returns The sliced embeddings broadcast to the shape of `inputs`.
   */
  call(inputs, kwargs) {
    return tidy(() => {
      // Resolve the default locally: `kwargs` may be omitted entirely, and the
      // caller's object should not be mutated as a side effect.
      const startIndex =
          kwargs != null && kwargs.startIndex != null ? kwargs.startIndex : 0;
      const shape = getExactlyOneTensor(inputs).shape;
      const featureLength = shape[shape.length - 1];
      const sequenceLength = shape[shape.length - 2];
      // Trim to match the length of the input sequence, which might be less
      // than the `sequenceLength` of the layer.
      const positionEmbeddings = this.positionEmbeddings.read().slice(
          [startIndex, 0], [sequenceLength, featureLength]);
      return positionEmbeddings.broadcastTo(shape);
    });
  }

  /**
   * The output has the same shape as the input.
   */
  computeOutputShape(inputShape) {
    return inputShape;
  }
}
// Static class name for this layer; assigned before the class is registered
// below.
/** @nocollapse */
PositionEmbedding.className = 'PositionEmbedding';
export { PositionEmbedding };
// Register the class with the tfjs-core `serialization` module.
// NOTE(review): registration presumably keys on `className` above so that
// saved configs can be mapped back to this class -- confirm.
serialization.registerClass(PositionEmbedding);
//# sourceMappingURL=data:application/json;base64,