T2TEmbedding.h 1.91 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31
/* NiuTrans.Tensor - an open-source tensor library
 * Copyright (C) 2018, Natural Language Processing Lab, Northestern University. 
 * All rights reserved.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

/*
 * $Created by: XIAO Tong (xiaotong@mail.neu.edu.cn) 2018-08-01
 */

#ifndef __T2TEMBEDDING_H__
#define __T2TEMBEDDING_H__

#include "../../network/XNet.h"

using namespace nts;

namespace transformer
{

xiaotong committed
32
#define DEFAULT_EMBEDDING_SIZE 512
33

34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52
/* 
embedding (of word at position i):
word embedding + positional embedding
*/
class T2TEmbedder
{
public:
    /* device id */
    int devID;
    
    /* memory pool */
    XMem * mem;
    
    /* vocabulary size */
    int vSize;

    /* embedding size */
    int eSize;

53 54 55
    /* maximum length of the sequence */
    int maxLength;

xiaotong committed
56 57 58
    /* dimension size of the hidden layers in the t2t model */
    int d;

59 60 61 62 63
    /* word embedding matrix */
    XTensor w;

    /* predefined positional embeddings. It can speeds up 
       the embedding processing by re-loading. */
64 65
    XTensor posEmbeddingBase;

66 67 68 69 70 71 72 73
public:
    /* constructor */
    T2TEmbedder();

    /* de-constructor */
    ~T2TEmbedder();

    /* initialize the model */
74
    void InitModel(int argc, char ** argv, int myDevID = -1, XMem * myMem = NULL, bool isEnc = true);
75 76 77 78 79

    /* make positional embeddings */
    void MakePosEmbedding(int eSize, int d, int length);

    /* make the network */
xiaotong committed
80
    XTensor Make(XTensor &input);
81 82 83 84 85
};

}

#endif