/* T2TFNN.h */
/* NiuTrans.Tensor - an open-source tensor library
 * Copyright (C) 2018, Natural Language Processing Lab, Northeastern University.
 * All rights reserved.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

/*
 * $Created by: XIAO Tong (xiaotong@mail.neu.edu.cn) 2018-07-31
 */

#ifndef __T2TFNN_H__
#define __T2TFNN_H__

#include "../../tensor/XTensor.h"

using namespace nts;

namespace transformer
{

/* a fnn: y = max(0, x * w1 + b1) * w2 + b2 */
class T2TFNN
{
public:
    /* device id */
    int devID;

    /* memory pool */
    XMem * mem;

    /* size of input vector */
    int inSize;

    /* size of output vector */
    int outSize;

    /* size of hidden layers */
    int hSize;

    /* matrix of transformation 1 */
    XTensor w1;

    /* bias of transformation 1 */
    XTensor b1;

    /* matrix of transformation 2 */
    XTensor w2;

    /* bias of transformation 2 */
    XTensor b2;
62 63 64
    
    /* dropout probability */
    DTYPE dropoutP;
65 66 67 68 69 70 71 72 73 74

public:

    /* constructor */
    T2TFNN();

    /* deconstructor */
    ~T2TFNN();

    /* initialize the model */
75
    void InitModel(int argc, char ** argv, int myDevID = -1, XMem * myMem = NULL);
76

77
    /* make the network */
78
    XTensor Make(XTensor &input, bool isTraining);
79

80 81 82 83
};

}

/* end of include guard __T2TFNN_H__ */
#endif