[
    [
        [
            "layers.Conv2D(128, 3) # input_shape = (64, 64, 3) by default",
            "layers.Conv2D(128, 3)",
            "nn.Conv2d(64, 128, 3)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.",
            "Conv2D(128, 3) # input_shape = (64, 64, 3) by default"
        ],
        [
            "layers.Conv2D(dim_out, 3, 2, padding='same')\n\n",
            "layers.Conv2D(dim_out, 3, 2)",
            "nn.Conv2d(dim_in, dim_out, 3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.",
            "Conv2D(dim_out, 3, 2, padding='same')\n\n"
        ],
        [
            "layers.Activation('relu')",
            "layers.ReLU()",
            "nn.ReLU()",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.",
            "Activation('relu')"
        ],
        [
            "layers.Dropout(0.1)",
            "layers.Dropout(0.1)",
            "nn.Dropout(0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.",
            "Dropout(0.1)"
        ],
        [
            "layers.Dense(dim_out)",
            "layers.Dense(dim_out)",
            "nn.Linear(dim_in, dim_out)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.",
            "Dense(dim_out)"
        ],
        [
            "\n",
            "x = tf.nn.relu(self.fc(x))",
            "x = F.relu(self.fc(x))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\n",
            "\n"
        ],
        [
            "layers.Embedding(vocab_size, embed_dim)",
            "layers.Embedding(vocab_size, embed_dim)",
            "nn.Embedding(vocab_size, embed_dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.",
            "Embedding(vocab_size, embed_dim)"
        ],
        [
            "max_len = 512\nself.embed_tokens = Embedding(n_words, dim_emb)\n\ndim_emb*2, dim_emb*2\n\ndef create_segment_list(batch_size=1, max_",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "# Translate PyTorch to Keras\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\n",
            "max_len = 512\nself.embed_tokens = Embedding(n_words, dim_emb)\n\ndim_emb*2, dim_emb*2\n\ndef create_segment_list(batch_size=1, max_"
        ],
        [
            "layers.MaxPool2D(pool_size=2, strides=2)\n\n",
            "layers.MaxPooling2D(2, 2)",
            "nn.MaxPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.",
            "MaxPool2D(pool_size=2, strides=2)\n\n"
        ],
        [
            "self.bn1 = layers.BatchNormalization(momentum=0.8, axis=-1)\nself.act1 = layers.LeakyReLU()\nself.conv1 = layers.Conv2D(dim, 3, padding='same')\nself.pool1 = layers.MaxPooling2D(pool_size=3, strides=2, input_shape=(img_w//2, img_h//2, dim))\n\nself.norm1 = layers.LayerNormalization()\n\nself.pool1 = L\nself.embed = nn.Embed(vocab_size, dim_emb, scale_",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNormalization(momentum=0.8, axis=-1)\nself.act1 = layers.LeakyReLU()\nself.conv1 = layers.Conv2D(dim, 3, padding='same')\nself.pool1 = layers.MaxPooling2D(pool_size=3, strides=2, input_shape=(img_w//2, img_h//2, dim))\n\nself.norm1 = layers.LayerNormalization()\n\nself.pool1 = L\nself.embed = nn.Embed(vocab_size, dim_emb, scale_"
        ],
        [
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3, padding='same', activation='relu')\nself.pool1 = layers.MaxPooling2D(pool_size=(2, 2))\n\n############\n\nf.shape\n[*, seq_len*2]\n\nimport requests\nimport json\n\nurl = 'http://reu.ms.mff.cuni.cz/api/sparql/query-via-url'\npreference = 'text/csv'\nquery = \"\"\"\n    PREFIX lip",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3, padding='same', activation='relu')\nself.pool1 = layers.MaxPooling2D(pool_size=(2, 2))\n\n############\n\nf.shape\n[*, seq_len*2]\n\nimport requests\nimport json\n\nurl = 'http://reu.ms.mff.cuni.cz/api/sparql/query-via-url'\npreference = 'text/csv'\nquery = \"\"\"\n    PREFIX lip"
        ],
        [
            "layers.LayerNormalization()\n\n",
            "layers.LayerNormalization()",
            "nn.LayerNorm(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.",
            "LayerNormalization()\n\n"
        ],
        [
            "layers.LeakyReLU()",
            "layers.LeakyReLU(args.leaky)",
            "nn.LeakyReLU(args.leaky)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.",
            "LeakyReLU()"
        ],
        [
            "layers.LSTM(512)",
            "layers.LSTM(512, dropout=0.1)",
            "nn.LSTM(512, 512, dropout=0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.",
            "LSTM(512)"
        ],
        [
            "tf.concat([states], -1)\n\n\n\n\n\n\n\n\n\n\n\n   \n\n\n\n\n\n\n\n\n\n\n\n",
            "tf.concat(states, axis=-1)",
            "torch.cat(states, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.",
            "concat([states], -1)\n\n\n\n\n\n\n\n\n\n\n\n   \n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "tf.nn.log_softmax(logits, axis=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "F.log_softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "log_softmax(logits, axis=-1)"
        ],
        [
            "tf.nn.softmax(logits, axis=-1)",
            "tf.nn.softmax(logits, axis=-1)",
            "F.softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "softmax(logits, axis=-1)"
        ],
        [
            "tf.reshape(x, [batch_size, 1, -1]) # Will be merged into [batch_size, 1, -1] dimensions",
            "tf.reshape(x, [batch_size, -1])",
            "torch.reshape(x, [batch_size, -1])",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.",
            "reshape(x, [batch_size, 1, -1]) # Will be merged into [batch_size, 1, -1] dimensions"
        ],
        [
            "layers.MultiHeadAttention(head_num=num_heads, dropout=attn_dropout, name='Multi_Head_Attention')  # No embed_dim arg.\n\n",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.",
            "MultiHeadAttention(head_num=num_heads, dropout=attn_dropout, name='Multi_Head_Attention')  # No embed_dim arg.\n\n"
        ],
        [
            "self.attn = layers.MultiHeadAttention(w_dim=args.d_model, h=args.n_heads, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = Sequential([\n            layers.LayerNormalization(args.d_model),\n            layers.Dropout(args.dropout)\n        ])",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\n",
            "self.attn = layers.MultiHeadAttention(w_dim=args.d_model, h=args.n_heads, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = Sequential([\n            layers.LayerNormalization(args.d_model),\n            layers.Dropout(args.dropout)\n        ])"
        ],
        [
            "\n",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\n",
            "\n"
        ],
        [
            "x = self.classifier(x)\nreturn layers.Activation('softmax')(x)",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\n",
            "x = self.classifier(x)\nreturn layers.Activation('softmax')(x)"
        ],
        [
            "\n",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\n",
            "\n"
        ],
        [
            "\n    \n\n    \n\n    \n\n    \n\n    \n\n    \n\n    \n\n    \n\n    ",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\n",
            "\n    \n\n    \n\n    \n\n    \n\n    \n\n    \n\n    \n\n    \n\n    "
        ],
        [
            "x = self.ffn1(x)\nx = x + self.drop(y)\n\n######################################################################\n\nhelp(TextCNN)",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\n",
            "x = self.ffn1(x)\nx = x + self.drop(y)\n\n######################################################################\n\nhelp(TextCNN)"
        ],
        [
            "self.bn1 = layers.BatchNormalization(\n    axis=-1, momentum=0.99, epsilon=0.001, center=True, scale=True\n)\nself.act1 = activation\nself.conv1 = layers.Conv2D(\n    filters=dim,\n    kernel_size=(3, 3),\n    strides=1,\n    padding=\"same\",\n    data_format=\"channels_last\",\n    dilation_rate=1,",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNormalization(\n    axis=-1, momentum=0.99, epsilon=0.001, center=True, scale=True\n)\nself.act1 = activation\nself.conv1 = layers.Conv2D(\n    filters=dim,\n    kernel_size=(3, 3),\n    strides=1,\n    padding=\"same\",\n    data_format=\"channels_last\",\n    dilation_rate=1,"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "layers.MaxPool2D(pool_size=3, strides=2)",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.",
            "MaxPool2D(pool_size=3, strides=2)"
        ],
        [
            "\n        if self.dim == 1024:\n\n          self.fc = PipelinedClassifier",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\n",
            "\n        if self.dim == 1024:\n\n          self.fc = PipelinedClassifier"
        ],
        [
            "layers.Conv2D(input_channels=128, filters=512, strides=2, kernel_size=5, use_bias=False)\n\n",
            "layers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)",
            "nn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.",
            "Conv2D(input_channels=128, filters=512, strides=2, kernel_size=5, use_bias=False)\n\n"
        ]
    ],
    [
        [
            "layers.Conv2D(128, 3)",
            "layers.Conv2D(128, 3)",
            "nn.Conv2d(64, 128, 3)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.",
            "Conv2D(128, 3)"
        ],
        [
            "layers.Conv2D(dim_out, 3, strides=2, padding=\"same\")",
            "layers.Conv2D(dim_out, 3, 2)",
            "nn.Conv2d(dim_in, dim_out, 3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.",
            "Conv2D(dim_out, 3, strides=2, padding=\"same\")"
        ],
        [
            "layers.ReLU()",
            "layers.ReLU()",
            "nn.ReLU()",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.",
            "ReLU()"
        ],
        [
            "layers.Dropout(0.1)\n\n",
            "layers.Dropout(0.1)",
            "nn.Dropout(0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.",
            "Dropout(0.1)\n\n"
        ],
        [
            "layers.Dense(dim_out)",
            "layers.Dense(dim_out)",
            "nn.Linear(dim_in, dim_out)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.",
            "Dense(dim_out)"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "x = tf.nn.relu(self.fc(x))",
            "x = F.relu(self.fc(x))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "layers.Embedding(vocab_size, embed_dim)\n\n",
            "layers.Embedding(vocab_size, embed_dim)",
            "nn.Embedding(vocab_size, embed_dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.",
            "Embedding(vocab_size, embed_dim)\n\n"
        ],
        [
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb)\n\nfor name, module in self.layers.named_children():\n    module.wdrop = (0.3 if name",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\n",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb)\n\nfor name, module in self.layers.named_children():\n    module.wdrop = (0.3 if name"
        ],
        [
            "layers.MaxPool2D(pool_size=2, strides=2)",
            "layers.MaxPooling2D(2, 2)",
            "nn.MaxPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.",
            "MaxPool2D(pool_size=2, strides=2)"
        ],
        [
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(alpha=0.2)\nself.conv1 = layers.Conv2D(dim, 3, padding=\"same\")\nself.pool1 = layers.MaxPool2D(2)\n\ndef preprocess(text):\n    '''\n    Removes punctuation and digits from a string, and converts all characters to lowercase. \n    Also clears all \\n and hyphens (splits hyphenated words into two words).\n    \n    '''\n        \n    preprocessed_text = text.lower().replace('",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(alpha=0.2)\nself.conv1 = layers.Conv2D(dim, 3, padding=\"same\")\nself.pool1 = layers.MaxPool2D(2)\n\ndef preprocess(text):\n    '''\n    Removes punctuation and digits from a string, and converts all characters to lowercase. \n    Also clears all \\n and hyphens (splits hyphenated words into two words).\n    \n    '''\n        \n    preprocessed_text = text.lower().replace('"
        ],
        [
            "self.bn1 = tf.keras.layers.BatchNormalization()\nself.act1 = tf.keras.layers.Activation('relu')\nself.conv1 = BasicConv2D(num_channels)\nself.pool1 = layers.AveragePooling1D(pool_size=2, strides=2)\n\n    \n    \n    \n    \n    \n    \n    \n    \n    \n    \n    \n    ########################################################################################\n    ## PyTorch:\n    def compute_average(self, hiddens_middle, lengths):\n        \"\"\"Computes an average of a list of RNN states. Used",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\n",
            "self.bn1 = tf.keras.layers.BatchNormalization()\nself.act1 = tf.keras.layers.Activation('relu')\nself.conv1 = BasicConv2D(num_channels)\nself.pool1 = layers.AveragePooling1D(pool_size=2, strides=2)\n\n    \n    \n    \n    \n    \n    \n    \n    \n    \n    \n    \n    ########################################################################################\n    ## PyTorch:\n    def compute_average(self, hiddens_middle, lengths):\n        \"\"\"Computes an average of a list of RNN states. Used"
        ],
        [
            "layers.BatchNormalization() #FIXME: Arguments?",
            "layers.LayerNormalization()",
            "nn.LayerNorm(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.",
            "BatchNormalization() #FIXME: Arguments?"
        ],
        [
            "layers.LeakyReLU(leaky = args.leaky)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "layers.LeakyReLU(args.leaky)",
            "nn.LeakyReLU(args.leaky)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.",
            "LeakyReLU(leaky = args.leaky)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "layers.LSTMSequence(512, 512, recurrent_dropout=0.1)",
            "layers.LSTM(512, dropout=0.1)",
            "nn.LSTM(512, 512, dropout=0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.",
            "LSTMSequence(512, 512, recurrent_dropout=0.1)"
        ],
        [
            "tf.concat(states, -1)",
            "tf.concat(states, axis=-1)",
            "torch.cat(states, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.",
            "concat(states, -1)"
        ],
        [
            "tf.nn.softmax(logits, axis=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "F.log_softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "softmax(logits, axis=-1)"
        ],
        [
            "tf.nn.softmax(logits, axis=-1)",
            "tf.nn.softmax(logits, axis=-1)",
            "F.softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "softmax(logits, axis=-1)"
        ],
        [
            "tf.reshape(x, [batch_size, -1])",
            "tf.reshape(x, [batch_size, -1])",
            "torch.reshape(x, [batch_size, -1])",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.",
            "reshape(x, [batch_size, -1])"
        ],
        [
            "layers.MultiHeadAttention(embed_dim=model_dim, attention_heads=num_heads, dropout=attn_dropout)",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.",
            "MultiHeadAttention(embed_dim=model_dim, attention_heads=num_heads, dropout=attn_dropout)"
        ],
        [
            "self.attn = Transformer(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization()\n\nprint('Section converted')\nloss_fake = out.loss_\npred_fake = out.pred_\nloss_cls = pred_fake\n\npeaks, _ = signal.find_peaks(loss_cls, threshold=thresh)\nplt.plot(loss_cls)\nplt.plot(peaks, loss_cl",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\n",
            "self.attn = Transformer(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization()\n\nprint('Section converted')\nloss_fake = out.loss_\npred_fake = out.pred_\nloss_cls = pred_fake\n\npeaks, _ = signal.find_peaks(loss_cls, threshold=thresh)\nplt.plot(loss_cls)\nplt.plot(peaks, loss_cl"
        ],
        [
            "\n         self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n\n\n         #if args.dropout > 0 or args.recurrent_dropout > 0:\n\n         #           self.rnn = layers.wrappers.Bidirectional(self.rnn, merge_mode=args.",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\n",
            "\n         self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n\n\n         #if args.dropout > 0 or args.recurrent_dropout > 0:\n\n         #           self.rnn = layers.wrappers.Bidirectional(self.rnn, merge_mode=args."
        ],
        [
            "return tf.nn.softmax(x)",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\n",
            "return tf.nn.softmax(x)"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n                                                        # ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;                        ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;                    ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;     ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n                                                        # ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;                        ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;                    ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;     ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;"
        ],
        [
            "\n",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\n",
            "\n"
        ],
        [
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\nclass Block(layers.Layer):\n      def __init__(self, num_channels, kernel_size=3",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\n",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\nclass Block(layers.Layer):\n      def __init__(self, num_channels, kernel_size=3"
        ],
        [
            "self.bn1 = layers.BatchNormalization(axis=1)\nself.act1 = activations.get('relu')\nself.conv1 = layers.Conv2D(filters=dim, strides=2, kernel_size=3, padding='same')\nself.pool1 = layers.MaxPooling2D(pool_size=3, strides=2)\n\n###################################################################################\n###############              PyTorch Transformer   #################################\n################################################################################",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNormalization(axis=1)\nself.act1 = activations.get('relu')\nself.conv1 = layers.Conv2D(filters=dim, strides=2, kernel_size=3, padding='same')\nself.pool1 = layers.MaxPooling2D(pool_size=3, strides=2)\n\n###################################################################################\n###############              PyTorch Transformer   #################################\n################################################################################"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "layers.MaxPooling2D(pool_size=3,strides=2)",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.",
            "MaxPooling2D(pool_size=3,strides=2)"
        ],
        [
            "\n    def __init__(self, units, name=None, **kwargs):\n\n",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\n",
            "\n    def __init__(self, units, name=None, **kwargs):\n\n"
        ],
        [
            "layers.Conv2D(filters=512, input_shape=in_channels, kernel_size=5, strides=2, padding='same')",
            "layers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)",
            "nn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.",
            "Conv2D(filters=512, input_shape=in_channels, kernel_size=5, strides=2, padding='same')"
        ]
    ],
    [
        [
            "layers.Conv2D(128, 3)",
            "layers.Conv2D(128, 3)",
            "nn.Conv2d(64, 128, 3)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.",
            "Conv2D(128, 3)"
        ],
        [
            "layers.Conv2D(filters=dim_out, kernel_size=3, strides=2, activation='relu')",
            "layers.Conv2D(dim_out, 3, 2)",
            "nn.Conv2d(dim_in, dim_out, 3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.",
            "Conv2D(filters=dim_out, kernel_size=3, strides=2, activation='relu')"
        ],
        [
            "layers.Activation(tf.nn.sigm",
            "layers.ReLU()",
            "nn.ReLU()",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.",
            "Activation(tf.nn.sigm"
        ],
        [
            "layers.Dropout(0.1)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "layers.Dropout(0.1)",
            "nn.Dropout(0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.",
            "Dropout(0.1)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "layers.Dense(dim_out)       # specify activate functions when instantiated the layer",
            "layers.Dense(dim_out)",
            "nn.Linear(dim_in, dim_out)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.",
            "Dense(dim_out)       # specify activate functions when instantiated the layer"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "x = tf.nn.relu(self.fc(x))",
            "x = F.relu(self.fc(x))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "layers.Embedding(vocab_size, embed_dim)",
            "layers.Embedding(vocab_size, embed_dim)",
            "nn.Embedding(vocab_size, embed_dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.",
            "Embedding(vocab_size, embed_dim)"
        ],
        [
            "inputs = Input(shape=(512, ))\nembed = Embedding(n_words, dim_emb)(inputs)\n\nclass Generator(nn.Module):\n    def __init__(self, dim_emb, dim_hid, n_layer",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\n",
            "inputs = Input(shape=(512, ))\nembed = Embedding(n_words, dim_emb)(inputs)\n\nclass Generator(nn.Module):\n    def __init__(self, dim_emb, dim_hid, n_layer"
        ],
        [
            "layers.MaxPool2D(pool_size=2, strides=2)",
            "layers.MaxPooling2D(2, 2)",
            "nn.MaxPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.",
            "MaxPool2D(pool_size=2, strides=2)"
        ],
        [
            "self.bn1 = layers.BatchNormalization(dim)\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3, data_format='channels_first')\nself.pool1 = layers.MaxPooling2D(3, 2, data_format='channels_first')\n\ndef calc_padding(dilation, kernel, stride):\n    \"\"\"Calculate the padding required for same convolutions.\"\"\"\n    return (dilation * (kernel-1) - stride + 1) // 2\n\n###################\nimport numpy as np\n",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNormalization(dim)\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3, data_format='channels_first')\nself.pool1 = layers.MaxPooling2D(3, 2, data_format='channels_first')\n\ndef calc_padding(dilation, kernel, stride):\n    \"\"\"Calculate the padding required for same convolutions.\"\"\"\n    return (dilation * (kernel-1) - stride + 1) // 2\n\n###################\nimport numpy as np\n"
        ],
        [
            "self.bn1 = tf.keras.layers.BatchNormalization(scale=True, center=False)\nself.act1 = tf.keras.layers.Activation(\"relu\")\nself.conv1 = layers.Conv2D(num_channels, 3, data_format=\"channels_last\")\nself.pool1 = layers.AveragePooling2D(2, 2)\n\nfor i, layer in enumerate(layers):\n    W1.append(model.nn.Linear(model_dim, model_dim).to(device).double())\n    W2.append(model.nn.Linear(model",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\n",
            "self.bn1 = tf.keras.layers.BatchNormalization(scale=True, center=False)\nself.act1 = tf.keras.layers.Activation(\"relu\")\nself.conv1 = layers.Conv2D(num_channels, 3, data_format=\"channels_last\")\nself.pool1 = layers.AveragePooling2D(2, 2)\n\nfor i, layer in enumerate(layers):\n    W1.append(model.nn.Linear(model_dim, model_dim).to(device).double())\n    W2.append(model.nn.Linear(model"
        ],
        [
            "layers.LayerNormalization(axis=dim)",
            "layers.LayerNormalization()",
            "nn.LayerNorm(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.",
            "LayerNormalization(axis=dim)"
        ],
        [
            "layers.LeakyReLU(args.leaky)\n\n\n\n\n\n\n\n\n\n\n\n",
            "layers.LeakyReLU(args.leaky)",
            "nn.LeakyReLU(args.leaky)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.",
            "LeakyReLU(args.leaky)\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "layers.LSTM(512, dropout=0.1)",
            "layers.LSTM(512, dropout=0.1)",
            "nn.LSTM(512, 512, dropout=0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.",
            "LSTM(512, dropout=0.1)"
        ],
        [
            "tf.concat(states, axis=-1)",
            "tf.concat(states, axis=-1)",
            "torch.cat(states, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.",
            "concat(states, axis=-1)"
        ],
        [
            "tf.nn.softmax(logits, axis=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "F.log_softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "softmax(logits, axis=-1)"
        ],
        [
            "tf.nn.softmax()",
            "tf.nn.softmax(logits, axis=-1)",
            "F.softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "softmax()"
        ],
        [
            "tf.reshape(x, [batch_size, -1])",
            "tf.reshape(x, [batch_size, -1])",
            "torch.reshape(x, [batch_size, -1])",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.",
            "reshape(x, [batch_size, -1])"
        ],
        [
            "layers.MultiHeadAttention(max_sequence_length=hparam.max_length, num_heads=num_heads, dropout=attn_dropout)",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.",
            "MultiHeadAttention(max_sequence_length=hparam.max_length, num_heads=num_heads, dropout=attn_dropout)"
        ],
        [
            "self.attn = layers.MultiHeadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\nclass TransformerED(nn.Module):\n    def __init__(self, d_model, n_heads, dropout, dropout_att):\n        \"Helper class for encapsulating the Transformer structure.\"\n        super(TransformerED, self).__init__()\n        \n        # Instantiate multi",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "# Translate PyTorch to Keras\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\n",
            "self.attn = layers.MultiHeadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\nclass TransformerED(nn.Module):\n    def __init__(self, d_model, n_heads, dropout, dropout_att):\n        \"Helper class for encapsulating the Transformer structure.\"\n        super(TransformerED, self).__init__()\n        \n        # Instantiate multi"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "x = self.classifier(x)\nreturn keras.layers.Softmax()(x)\n\nnn.TransformerEncoderLayer(d_model=hidden_dim, nhead=2, dim",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\n",
            "x = self.classifier(x)\nreturn keras.layers.Softmax()(x)\n\nnn.TransformerEncoderLayer(d_model=hidden_dim, nhead=2, dim"
        ],
        [
            "\n  x = K.reshape(x, (-1, 24 * 64))    # or x = K.reshape(x, (-1, 24 * model_dim))\n\n  y = K.reshape(y, (-1, 24 * 64))    # or y = K.reshape(x, (-1, 24 * model_dim))\n\n ",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\n",
            "\n  x = K.reshape(x, (-1, 24 * 64))    # or x = K.reshape(x, (-1, 24 * model_dim))\n\n  y = K.reshape(y, (-1, 24 * 64))    # or y = K.reshape(x, (-1, 24 * model_dim))\n\n "
        ],
        [
            "\n  # Create 2 conv layers with 64 channels and 5*5 kernels. Example:",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\n",
            "\n  # Create 2 conv layers with 64 channels and 5*5 kernels. Example:"
        ],
        [
            "x = layers.Dropout(0.1)(layers.Activation('relu')(layers.Dense(self.ffn1, units=x.shape[1])(x)))\nx = layers.Dropout(0.1)(layers.Add()([x",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\n",
            "x = layers.Dropout(0.1)(layers.Activation('relu')(layers.Dense(self.ffn1, units=x.shape[1])(x)))\nx = layers.Dropout(0.1)(layers.Add()([x"
        ],
        [
            "self.bn1 = BatchNormalization(dim)\nself.act1 = Activation()\nself.conv1 = Conv2D(start_filters, 3, padding='same')\nself.pool1 = MaxPooling2D(pool_size=(3, 2))\n\nself.layer_1 = layers.Conv2D(filters=128, kernel_size=3, strides=1)\nself.layer_2 = layers.MaxPool2D(pool_size",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "self.bn1 = BatchNormalization(dim)\nself.act1 = Activation()\nself.conv1 = Conv2D(start_filters, 3, padding='same')\nself.pool1 = MaxPooling2D(pool_size=(3, 2))\n\nself.layer_1 = layers.Conv2D(filters=128, kernel_size=3, strides=1)\nself.layer_2 = layers.MaxPool2D(pool_size"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "layers.MaxPooling1D(strides=2)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n # some defined layers etc. so that we can write",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.",
            "MaxPooling1D(strides=2)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n # some defined layers etc. so that we can write"
        ],
        [
            "\n\n\n\n\n\n\n  # ///////////////////////////////////////////////////////////////\n\n  # Blocks (used in src",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\n",
            "\n\n\n\n\n\n\n  # ///////////////////////////////////////////////////////////////\n\n  # Blocks (used in src"
        ],
        [
            "layers.Conv2D(filters=512, kernel_size=5, strides=2, use_bias=False)",
            "layers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)",
            "nn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.",
            "Conv2D(filters=512, kernel_size=5, strides=2, use_bias=False)"
        ]
    ],
    [
        [
            "layers.Conv2D(64, (3, 3))",
            "layers.Conv2D(128, 3)",
            "nn.Conv2d(64, 128, 3)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.",
            "Conv2D(64, (3, 3))"
        ],
        [
            "layers.Conv2D(dim_out, 3, 2, padding='same')  # multi-channel 2D convolution layer using strides=2 and zero padding to add up",
            "layers.Conv2D(dim_out, 3, 2)",
            "nn.Conv2d(dim_in, dim_out, 3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.",
            "Conv2D(dim_out, 3, 2, padding='same')  # multi-channel 2D convolution layer using strides=2 and zero padding to add up"
        ],
        [
            "layers.ReLU()",
            "layers.ReLU()",
            "nn.ReLU()",
            "# Translate PyTorch to Keras\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.",
            "ReLU()"
        ],
        [
            "layers.Dropout(0.1, noise_shape=(1, 1, 100))",
            "layers.Dropout(0.1)",
            "nn.Dropout(0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.",
            "Dropout(0.1, noise_shape=(1, 1, 100))"
        ],
        [
            "layers.Dense(dim_out)",
            "layers.Dense(dim_out)",
            "nn.Linear(dim_in, dim_out)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.",
            "Dense(dim_out)"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "x = tf.nn.relu(self.fc(x))",
            "x = F.relu(self.fc(x))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "layers.Embedding(vocab_size, embed_dim)\n\n",
            "layers.Embedding(vocab_size, embed_dim)",
            "nn.Embedding(vocab_size, embed_dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.",
            "Embedding(vocab_size, embed_dim)\n\n"
        ],
        [
            "self.embed_tokens = layers.Embedding(embed_dim=dim_emb, input_dim=n_words)\nself.embed_scale = math.sqrt(args.d_model)\n\nself.pos_embed = Sin",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "# Translate PyTorch to Keras\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\n",
            "self.embed_tokens = layers.Embedding(embed_dim=dim_emb, input_dim=n_words)\nself.embed_scale = math.sqrt(args.d_model)\n\nself.pos_embed = Sin"
        ],
        [
            "layers.MaxPooling2D(2, 2)",
            "layers.MaxPooling2D(2, 2)",
            "nn.MaxPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.",
            "MaxPooling2D(2, 2)"
        ],
        [
            "self.bn1 = nn.BatchNormalization()\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\ndef gamma_transform(parameters, gamma):\n    parameters = copy.deepcopy(parameters)\n    normalization = get_normalization(parameters)\n    for module in normalization.modules():\n        if isinstance(module, nn.modules.batchnorm._BatchNorm):\n            gamma_tensor =",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "self.bn1 = nn.BatchNormalization()\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\ndef gamma_transform(parameters, gamma):\n    parameters = copy.deepcopy(parameters)\n    normalization = get_normalization(parameters)\n    for module in normalization.modules():\n        if isinstance(module, nn.modules.batchnorm._BatchNorm):\n            gamma_tensor ="
        ],
        [
            "self.bn1 = layers.BatchNormalization(momentum=0.99, epsilon=0.001, center=True, scale=True,\n                                     beta_initializer='zeros', gamma_initializer='ones',\n                                     moving_mean_initializer='zeros',\n                                     moving_variance_initializer='ones')(self.conv1)\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(filters=num_channels, kernel_size=(3, 3), strides=(1, 1), padding='same',\n                           use_bias=False)(self.bn",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNormalization(momentum=0.99, epsilon=0.001, center=True, scale=True,\n                                     beta_initializer='zeros', gamma_initializer='ones',\n                                     moving_mean_initializer='zeros',\n                                     moving_variance_initializer='ones')(self.conv1)\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(filters=num_channels, kernel_size=(3, 3), strides=(1, 1), padding='same',\n                           use_bias=False)(self.bn"
        ],
        [
            "layers.normalization.BatchNormalization(axis=dim, e",
            "layers.LayerNormalization()",
            "nn.LayerNorm(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.",
            "normalization.BatchNormalization(axis=dim, e"
        ],
        [
            "layers.LeakyReLU(args.leaky)\"\"\"",
            "layers.LeakyReLU(args.leaky)",
            "nn.LeakyReLU(args.leaky)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.",
            "LeakyReLU(args.leaky)\"\"\""
        ],
        [
            "layers.GRU(512) #, dropout=0.1, recurrent_dropout=0.1)\n\n",
            "layers.LSTM(512, dropout=0.1)",
            "nn.LSTM(512, 512, dropout=0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.",
            "GRU(512) #, dropout=0.1, recurrent_dropout=0.1)\n\n"
        ],
        [
            "tf.concat(states, axis=-1)",
            "tf.concat(states, axis=-1)",
            "torch.cat(states, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.",
            "concat(states, axis=-1)"
        ],
        [
            "tf.nn.log_softmax(logits, axis=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "F.log_softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "log_softmax(logits, axis=-1)"
        ],
        [
            "tf.nn.softmax(logits, axis=-1)",
            "tf.nn.softmax(logits, axis=-1)",
            "F.softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "softmax(logits, axis=-1)"
        ],
        [
            "tf.reshape(x, [batch_size, -1])\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "tf.reshape(x, [batch_size, -1])",
            "torch.reshape(x, [batch_size, -1])",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.",
            "reshape(x, [batch_size, -1])\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "layers.MultiHeadAttention(model_dim, num_heads, attn_dropout)",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.",
            "MultiHeadAttention(model_dim, num_heads, attn_dropout)"
        ],
        [
            "self.attn = MultiHeadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization()\n\n## translate things to be closer to pytorch\nattn_q = layers.Dense(dim_attn) \nattn_k = layers.Dense(dim_attn) \nattn_v = layers.Dense(dim_attn)\nff = layers.Dense(512)\nself.attn = Multi",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\n",
            "self.attn = MultiHeadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization()\n\n## translate things to be closer to pytorch\nattn_q = layers.Dense(dim_attn) \nattn_k = layers.Dense(dim_attn) \nattn_v = layers.Dense(dim_attn)\nff = layers.Dense(512)\nself.attn = Multi"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "return tf.nn.softmax(x, axis=-1)\n\n\"\"\"\nloss = self.loss_fn(x, y_)\ntrainable_params = filter(lambda p: p.requires_grad",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\n",
            "return tf.nn.softmax(x, axis=-1)\n\n\"\"\"\nloss = self.loss_fn(x, y_)\ntrainable_params = filter(lambda p: p.requires_grad"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n                                                                                         package_data={'image_loading': ['data/*.txt",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n                                                                                         package_data={'image_loading': ['data/*.txt"
        ],
        [
            "\n        x_pos, y_pos = tensorflow.unstack(pos",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\n",
            "\n        x_pos, y_pos = tensorflow.unstack(pos"
        ],
        [
            "y = self.flatten(self.act1(self.dense1(self.conv1(self.pool1(self.bn1(x))))))\nx = x + self.drop(y)\n\n########################################################################################################################\n\nfrom torch import nn\nimport",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\n",
            "y = self.flatten(self.act1(self.dense1(self.conv1(self.pool1(self.bn1(x))))))\nx = x + self.drop(y)\n\n########################################################################################################################\n\nfrom torch import nn\nimport"
        ],
        [
            "self.bn1 = layers.BatchNormalization(self.conv_dim)\nself.act1 = activation()\nself.conv1 = layers.Conv2D(dim, 3, strides=2, padding='same', use_bias=False)\nself.pool1 = layers.MaxPooling2D(pool_size=[3, 2])\n\n## Translate layer\n\nclass MultiheadAttention(tf1.keras.layers.Layer):\n\n    # Py",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNormalization(self.conv_dim)\nself.act1 = activation()\nself.conv1 = layers.Conv2D(dim, 3, strides=2, padding='same', use_bias=False)\nself.pool1 = layers.MaxPooling2D(pool_size=[3, 2])\n\n## Translate layer\n\nclass MultiheadAttention(tf1.keras.layers.Layer):\n\n    # Py"
        ],
        [
            "\n         x = Conv2D(planes, 3, strides=1, dilation_rate=2, padding='same', use_bias=False)(x)\n\n         x = BatchNormalization()(x)\n\n         x = Activation",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\n",
            "\n         x = Conv2D(planes, 3, strides=1, dilation_rate=2, padding='same', use_bias=False)(x)\n\n         x = BatchNormalization()(x)\n\n         x = Activation"
        ],
        [
            "layers.MaxPooling1D(pool_size=3, strides=2)",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.",
            "MaxPooling1D(pool_size=3, strides=2)"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "layers.Conv2D(filters=512, kernel_size=5, strides=2, padding='valid', use_bias=False)",
            "layers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)",
            "nn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.",
            "Conv2D(filters=512, kernel_size=5, strides=2, padding='valid', use_bias=False)"
        ]
    ],
    [
        [
            "layers.Conv2D(128, 3)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "layers.Conv2D(128, 3)",
            "nn.Conv2d(64, 128, 3)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.",
            "Conv2D(128, 3)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "layers.Conv2D([dim_in, 1, dim_out, 2], [3, 1])",
            "layers.Conv2D(dim_out, 3, 2)",
            "nn.Conv2d(dim_in, dim_out, 3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.",
            "Conv2D([dim_in, 1, dim_out, 2], [3, 1])"
        ],
        [
            "layers.ReLU()",
            "layers.ReLU()",
            "nn.ReLU()",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.",
            "ReLU()"
        ],
        [
            "layers.Dropout(0.1)",
            "layers.Dropout(0.1)",
            "nn.Dropout(0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.",
            "Dropout(0.1)"
        ],
        [
            "layers.Dense(dim_out)",
            "layers.Dense(dim_out)",
            "nn.Linear(dim_in, dim_out)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.",
            "Dense(dim_out)"
        ],
        [
            "\n",
            "x = tf.nn.relu(self.fc(x))",
            "x = F.relu(self.fc(x))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\n",
            "\n"
        ],
        [
            "layers.Embedding(vocab_size, embed_dim) # It takes an integer input, not one-hot encoding! \n\n",
            "layers.Embedding(vocab_size, embed_dim)",
            "nn.Embedding(vocab_size, embed_dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.",
            "Embedding(vocab_size, embed_dim) # It takes an integer input, not one-hot encoding! \n\n"
        ],
        [
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb)\n\nself.embed_positions = PositionalEmbedding(\n    max_len, dim_emb, self.padding_",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\n",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb)\n\nself.embed_positions = PositionalEmbedding(\n    max_len, dim_emb, self.padding_"
        ],
        [
            "layers.MaxPool2D(2, 2)",
            "layers.MaxPooling2D(2, 2)",
            "nn.MaxPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.",
            "MaxPool2D(2, 2)"
        ],
        [
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3, padding='same')\nself.pool1 = layers.MaxPool2D(3, 2, padding='same')",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3, padding='same')\nself.pool1 = layers.MaxPool2D(3, 2, padding='same')"
        ],
        [
            "layers.BatchNormalization()\nlayers.Activation('relu')\nlayers.Conv2D(num_channels, 3)\nlayers.AveragePooling2D(2)\n\nclass CustomLinear(tf.layers.Layer):\n    def __init__(self, units, activation=None, **kwargs):\n        super(CustomLinear, self).__init__(**kwargs)\n\n        # self.units = units\n        self.activation = activation\n        # self.activation = tf.nn.tanh if activation == 'tanh' else tf.nn.elu\n\n    def build(self, input_shape",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\n",
            "layers.BatchNormalization()\nlayers.Activation('relu')\nlayers.Conv2D(num_channels, 3)\nlayers.AveragePooling2D(2)\n\nclass CustomLinear(tf.layers.Layer):\n    def __init__(self, units, activation=None, **kwargs):\n        super(CustomLinear, self).__init__(**kwargs)\n\n        # self.units = units\n        self.activation = activation\n        # self.activation = tf.nn.tanh if activation == 'tanh' else tf.nn.elu\n\n    def build(self, input_shape"
        ],
        [
            "layers.LayerNormalization(axis=-1)",
            "layers.LayerNormalization()",
            "nn.LayerNorm(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.",
            "LayerNormalization(axis=-1)"
        ],
        [
            "layers.LeakyReLU()",
            "layers.LeakyReLU(args.leaky)",
            "nn.LeakyReLU(args.leaky)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.",
            "LeakyReLU()"
        ],
        [
            "layers.LSTM(512, dropout=0.1)",
            "layers.LSTM(512, dropout=0.1)",
            "nn.LSTM(512, 512, dropout=0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.",
            "LSTM(512, dropout=0.1)"
        ],
        [
            "tf.concat(states, axis=-1)",
            "tf.concat(states, axis=-1)",
            "torch.cat(states, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.",
            "concat(states, axis=-1)"
        ],
        [
            "tf.nn.log_softmax(logits, axis=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "F.log_softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "log_softmax(logits, axis=-1)"
        ],
        [
            "tf.nn.softmax(logits, axis=-1)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "tf.nn.softmax(logits, axis=-1)",
            "F.softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "softmax(logits, axis=-1)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "tf.reshape(x, [batch_size, -1])  # batch_size is set to None which stood for batch_size? It is",
            "tf.reshape(x, [batch_size, -1])",
            "torch.reshape(x, [batch_size, -1])",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.",
            "reshape(x, [batch_size, -1])  # batch_size is set to None which stood for batch_size? It is"
        ],
        [
            "layers.MultiHeadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate PyTorch to Keras\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.",
            "MultiHeadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)"
        ],
        [
            "self.attn = tf.contrib.seq2seq.MultiHeadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = tf.layers.Dropout(rate=args.dropout, training=self.training)\nself.norm1 = tf.contrib.layers.LayerNormalization(args.d_model)\n\nself.drop2 = tf.layers.Dropout(rate=args.dropout, training=self.training)\nself.norm2 = tf.contrib.layers.LayerNormalization(args",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\n",
            "self.attn = tf.contrib.seq2seq.MultiHeadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = tf.layers.Dropout(rate=args.dropout, training=self.training)\nself.norm1 = tf.contrib.layers.LayerNormalization(args.d_model)\n\nself.drop2 = tf.layers.Dropout(rate=args.dropout, training=self.training)\nself.norm2 = tf.contrib.layers.LayerNormalization(args"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "return tf.compat.v1.nn.log_softmax(x, axis=-1)\n\ndef get_chkp(model, epoch, suffix=''):\n    state = {\n            '",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\n",
            "return tf.compat.v1.nn.log_softmax(x, axis=-1)\n\ndef get_chkp(model, epoch, suffix=''):\n    state = {\n            '"
        ],
        [
            "\n",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\n",
            "\n"
        ],
        [
            "\n     tf.TensorSpec(x.shape, x.dtype))) ",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\n",
            "\n     tf.TensorSpec(x.shape, x.dtype))) "
        ],
        [
            "y = self.ffn2(tf.keras.activations.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\nprint(\"all done\")",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\n",
            "y = self.ffn2(tf.keras.activations.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\nprint(\"all done\")"
        ],
        [
            "beta_initializer=tf.initializers.constant(betas)\ngamma_initializer=tf.initializers.constant(gammas)\nself.bn1 = layers.BatchNormalization(beta_initializer=beta_initializer,\n                                     gamma_initializer=gamma_initializer)\nself.act1 = activation()\n\ninitializers=tf.keras.initializers\nself.conv1 = layers.Conv2D(dim,\n                          ",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "beta_initializer=tf.initializers.constant(betas)\ngamma_initializer=tf.initializers.constant(gammas)\nself.bn1 = layers.BatchNormalization(beta_initializer=beta_initializer,\n                                     gamma_initializer=gamma_initializer)\nself.act1 = activation()\n\ninitializers=tf.keras.initializers\nself.conv1 = layers.Conv2D(dim,\n                          "
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "layers.MaxPooling1D(pool_size=3, strides=2)\n\n     # Classifier is just a single Fully Connected Layer\n\n # PyTor",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.",
            "MaxPooling1D(pool_size=3, strides=2)\n\n     # Classifier is just a single Fully Connected Layer\n\n # PyTor"
        ],
        [
            "\n",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\n",
            "\n"
        ],
        [
            "layers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False))\n\n",
            "layers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)",
            "nn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.",
            "Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False))\n\n"
        ]
    ]
]