[
    [
        [
            "nn.ReLU()",
            "nn.ReLU()",
            "layers.ReLU()",
            "# Translate Keras to PyTorch\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.",
            "ReLU()"
        ],
        [
            "nn.Dropout(0.1)",
            "nn.Dropout(0.1)",
            "layers.Dropout(0.1)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.",
            "Dropout(0.1)"
        ],
        [
            "x = nn.ReLU(self.fc(x))",
            "x = F.relu(self.fc(x))",
            "x = tf.nn.relu(self.fc(x))",
            "# Translate Keras to PyTorch\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\n",
            "x = nn.ReLU(self.fc(x))"
        ],
        [
            "nn.Embedding(vocab_size, embed_dim)",
            "nn.Embedding(vocab_size, embed_dim)",
            "layers.Embedding(vocab_size, embed_dim)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.",
            "Embedding(vocab_size, embed_dim)"
        ],
        [
            "embedding = nn.Embedding(n_words, dim_emb, input_length=max_len)",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\n",
            "embedding = nn.Embedding(n_words, dim_emb, input_length=max_len)"
        ],
        [
            "nn.MaxPooling2D(2, 2)",
            "nn.MaxPool2d(2, 2)",
            "layers.MaxPooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.",
            "MaxPooling2D(2, 2)"
        ],
        [
            "layer_defs = [\n\nbatch_normalization(),\nleaky_relu(),\nconv2d(),\nmax_pooling2d()\n]\n\ndef forward(self, x):\n\nx = F.batch_normalization(x)\nx = self.leaky_relu(x)\nx = F.conv2d(x, 32)\nx = F.max_pooling2d(x, 2, 2)\nreturn x",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "layer_defs = [\n\nbatch_normalization(),\nleaky_relu(),\nconv2d(),\nmax_pooling2d()\n]\n\ndef forward(self, x):\n\nx = F.batch_normalization(x)\nx = self.leaky_relu(x)\nx = F.conv2d(x, 32)\nx = F.max_pooling2d(x, 2, 2)\nreturn x"
        ],
        [
            "self.bn1 = nn.BatchNormalization()\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2D(num_channels, 3)\nself.pool1 = nn.AveragePooling2D(2, 2)",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\n",
            "self.bn1 = nn.BatchNormalization()\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2D(num_channels, 3)\nself.pool1 = nn.AveragePooling2D(2, 2)"
        ],
        [
            "nn.LeakyReLU(args.leaky)",
            "nn.LeakyReLU(args.leaky)",
            "layers.LeakyReLU(args.leaky)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.",
            "LeakyReLU(args.leaky)"
        ],
        [
            "torch.cat(states.Tensor, axis=-1)",
            "torch.cat(states, dim=-1)",
            "tf.concat(states, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.",
            "cat(states.Tensor, axis=-1)"
        ],
        [
            "F.log_softmax(logits, axis=-1)",
            "F.log_softmax(logits, dim=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.",
            "log_softmax(logits, axis=-1)"
        ],
        [
            "F.softmax(logits, axis=-1)",
            "F.softmax(logits, dim=-1)",
            "tf.nn.softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.",
            "softmax(logits, axis=-1)"
        ],
        [
            "torch.reshape(x, [batch_size, -1])",
            "torch.reshape(x, [batch_size, -1])",
            "tf.reshape(x, [batch_size, -1])",
            "# Translate Keras to PyTorch\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.",
            "reshape(x, [batch_size, -1])"
        ],
        [
            "nn.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate Keras to PyTorch\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.",
            "MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)"
        ],
        [
            "self.attn = nn.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\n",
            "self.attn = nn.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)"
        ],
        [
            "self.rnn = (nn.LSTM(d_model) if rnn_type == 'LSTM' else nn.GRU(d_model))",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\n",
            "self.rnn = (nn.LSTM(d_model) if rnn_type == 'LSTM' else nn.GRU(d_model))"
        ],
        [
            "y = self.classifier(x)\nreturn y",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\n",
            "y = self.classifier(x)\nreturn y"
        ],
        [
            "z = torch.concat([x.view(-1, -1), y.view(-1, -1)], 1)",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "# Translate Keras to PyTorch\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\n",
            "z = torch.concat([x.view(-1, -1), y.view(-1, -1)], 1)"
        ],
        [
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\n",
            "x = self.layer1(x)"
        ],
        [
            "y = torch.nn.relu(self.ffn1(x))\nx = x + self.drop(y)",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\n",
            "y = torch.nn.relu(self.ffn1(x))\nx = x + self.drop(y)"
        ],
        [
            "self.bn1 = nn.BatchNormalization()\nself.act1 = nn.Activation()\nself.conv1 = nn.Conv3x3(dim)\nself.pool1 = nn.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "self.bn1 = nn.BatchNormalization()\nself.act1 = nn.Activation()\nself.conv1 = nn.Conv3x3(dim)\nself.pool1 = nn.MaxPooling2D(3, 2)"
        ],
        [
            "self.layer_1 = torch.nn.Conv2d(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\n",
            "self.layer_1 = torch.nn.Conv2d(planes, kernel=3, stride=1, dilation=2)"
        ],
        [
            "nn.MaxPooling2D(pool_size=3, strides=2)",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.",
            "MaxPooling2D(pool_size=3, strides=2)"
        ],
        [
            "self.fc = nn.Linear(dim)",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\n",
            "self.fc = nn.Linear(dim)"
        ]
    ],
    [
        [
            "nn.ReLU()",
            "nn.ReLU()",
            "layers.ReLU()",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.",
            "ReLU()"
        ],
        [
            "nn.Dropout(0.1)",
            "nn.Dropout(0.1)",
            "layers.Dropout(0.1)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.",
            "Dropout(0.1)"
        ],
        [
            "x = F.relu(self.fc(x))",
            "x = F.relu(self.fc(x))",
            "x = tf.nn.relu(self.fc(x))",
            "# Translate Keras to PyTorch\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\n",
            "x = F.relu(self.fc(x))"
        ],
        [
            "nn.Embedding(vocab_size, embed_dim)",
            "nn.Embedding(vocab_size, embed_dim)",
            "layers.Embedding(vocab_size, embed_dim)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.",
            "Embedding(vocab_size, embed_dim)"
        ],
        [
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb, input_length=max_len)",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\n",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb, input_length=max_len)"
        ],
        [
            "nn.MaxPooling2D(2, 2)",
            "nn.MaxPool2d(2, 2)",
            "layers.MaxPooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.",
            "MaxPooling2D(2, 2)"
        ],
        [
            "self.bn1 = nn.BatchNormalization()\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2D(dim, 3)\nself.pool1 = nn.MaxPooling2D(3, 2)\n\nclassifier = keras.models.Sequential()\nclassifier.add(layers.Dense(10, activation='softmax'))\nclassifier.compile(loss='categorical_crossentropy',\noptimizer='adam',\nmetrics",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "self.bn1 = nn.BatchNormalization()\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2D(dim, 3)\nself.pool1 = nn.MaxPooling2D(3, 2)\n\nclassifier = keras.models.Sequential()\nclassifier.add(layers.Dense(10, activation='softmax'))\nclassifier.compile(loss='categorical_crossentropy',\noptimizer='adam',\nmetrics"
        ],
        [
            "nn.BatchNormalization()\nnn.ReLU()\nnn.Conv2D(num_channels, 3)\nnn.AveragePooling2D(2, 2)",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\n",
            "nn.BatchNormalization()\nnn.ReLU()\nnn.Conv2D(num_channels, 3)\nnn.AveragePooling2D(2, 2)"
        ],
        [
            "nn.LeakyReLU(args.leaky)",
            "nn.LeakyReLU(args.leaky)",
            "layers.LeakyReLU(args.leaky)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.",
            "LeakyReLU(args.leaky)"
        ],
        [
            "torch.concat(states, -1)",
            "torch.cat(states, dim=-1)",
            "tf.concat(states, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.",
            "concat(states, -1)"
        ],
        [
            "F.log_softmax(logits, axis=-1)",
            "F.log_softmax(logits, dim=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.",
            "log_softmax(logits, axis=-1)"
        ],
        [
            "F.log_softmax(logits, dim=-1)",
            "F.softmax(logits, dim=-1)",
            "tf.nn.softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.",
            "log_softmax(logits, dim=-1)"
        ],
        [
            "torch.reshape(x, [batch_size, -1])",
            "torch.reshape(x, [batch_size, -1])",
            "tf.reshape(x, [batch_size, -1])",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.",
            "reshape(x, [batch_size, -1])"
        ],
        [
            "nn.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.",
            "MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)"
        ],
        [
            "\nclass MultiHeadAttention(nn.Module):\n\ndef __init__(self, n_heads, d_model, dropout=0.0):\n\nsuper().__init__()\n\nself.param_scope = \"attention\"\n\nself.n_heads = n_heads\n\nself.d_model = d_model\n\nself.dropout = dropout\n\n\ndef forward(self, x):\n\nh1 = F.head(x, 1)\nh2 = F.head(x, 2)\n\natt = self.attn(h1, h2)\n",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\n",
            "\nclass MultiHeadAttention(nn.Module):\n\ndef __init__(self, n_heads, d_model, dropout=0.0):\n\nsuper().__init__()\n\nself.param_scope = \"attention\"\n\nself.n_heads = n_heads\n\nself.d_model = d_model\n\nself.dropout = dropout\n\n\ndef forward(self, x):\n\nh1 = F.head(x, 1)\nh2 = F.head(x, 2)\n\natt = self.attn(h1, h2)\n"
        ],
        [
            "self.rnn = torch.nn.LSTM(d_model, use_peephole=True)",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\n",
            "self.rnn = torch.nn.LSTM(d_model, use_peephole=True)"
        ],
        [
            "x = self.classifier(x)\nreturn torch.log_softmax(x, dim=-1)",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\n",
            "x = self.classifier(x)\nreturn torch.log_softmax(x, dim=-1)"
        ],
        [
            "z = torch.concat([x, y], dim=1)",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\n",
            "z = torch.concat([x, y], dim=1)"
        ],
        [
            "x = x",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\n",
            "x = x"
        ],
        [
            "y = F.relu(self.fc(x))\nx = x + self.drop(y)",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\n",
            "y = F.relu(self.fc(x))\nx = x + self.drop(y)"
        ],
        [
            "self.bn1 = nn.BatchNormalization()\nself.act1 = nn.activation()\nself.conv1 = nn. Conv3x3(dim)\nself.pool1 = nn. MaxPooling2D(3, 2)\n\ndef forward(self, input):\n\n\"\"\"\n\nPerform the forward pass for the model.\n\n:param input: The input to the model.\n\n:return: The output of",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "self.bn1 = nn.BatchNormalization()\nself.act1 = nn.activation()\nself.conv1 = nn. Conv3x3(dim)\nself.pool1 = nn. MaxPooling2D(3, 2)\n\ndef forward(self, input):\n\n\"\"\"\n\nPerform the forward pass for the model.\n\n:param input: The input to the model.\n\n:return: The output of"
        ],
        [
            "self.layer_1 = F.Conv2d(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate Keras to PyTorch\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\n",
            "self.layer_1 = F.Conv2d(planes, kernel=3, stride=1, dilation=2)"
        ],
        [
            "nn.MaxPooling2D(pool_size=3, strides=2)",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.",
            "MaxPooling2D(pool_size=3, strides=2)"
        ],
        [
            "self.fc = nn.Linear(dim, dropout=args.out_drop",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\n",
            "self.fc = nn.Linear(dim, dropout=args.out_drop"
        ]
    ],
    [
        [
            "nn.ReLU()",
            "nn.ReLU()",
            "layers.ReLU()",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.",
            "ReLU()"
        ],
        [
            "nn.Dropout(0.1)",
            "nn.Dropout(0.1)",
            "layers.Dropout(0.1)",
            "# Translate Keras to PyTorch\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.",
            "Dropout(0.1)"
        ],
        [
            "x = F.relu(self.fc(x))",
            "x = F.relu(self.fc(x))",
            "x = tf.nn.relu(self.fc(x))",
            "# Translate Keras to PyTorch\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\n",
            "x = F.relu(self.fc(x))"
        ],
        [
            "nn.Embedding(vocab_size, embed_dim)",
            "nn.Embedding(vocab_size, embed_dim)",
            "layers.Embedding(vocab_size, embed_dim)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.",
            "Embedding(vocab_size, embed_dim)"
        ],
        [
            "self.embed_tokens = nn.Embedding(n_words, dim_emb, input_length=max_len)",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "# Translate Keras to PyTorch\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\n",
            "self.embed_tokens = nn.Embedding(n_words, dim_emb, input_length=max_len)"
        ],
        [
            "nn.MaxPooling2D(2, 2)",
            "nn.MaxPool2d(2, 2)",
            "layers.MaxPooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.",
            "MaxPooling2D(2, 2)"
        ],
        [
            "self.bn1 = nn.BatchNormalization()\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2D(dim, 3)\nself.pool1 = nn.MaxPooling2D(3, 2)\n\nself.bn2 = layers.BatchNormalization()\nself.act2 = layers.LeakyReLU(0.2)\nself.conv2 = layers.Conv2D(dim, 3)\nself.pool2 = layers.MaxPooling2",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "self.bn1 = nn.BatchNormalization()\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2D(dim, 3)\nself.pool1 = nn.MaxPooling2D(3, 2)\n\nself.bn2 = layers.BatchNormalization()\nself.act2 = layers.LeakyReLU(0.2)\nself.conv2 = layers.Conv2D(dim, 3)\nself.pool2 = layers.MaxPooling2"
        ],
        [
            "nn.BatchNormalization(\u2026)\nnn.ReLU(\u2026)\nnn.Conv2d(\u2026)\nnn.AveragePooling2d(\u2026)",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\n",
            "nn.BatchNormalization(\u2026)\nnn.ReLU(\u2026)\nnn.Conv2d(\u2026)\nnn.AveragePooling2d(\u2026)"
        ],
        [
            "nn.LeakyReLU(alpha=args.leaky)",
            "nn.LeakyReLU(args.leaky)",
            "layers.LeakyReLU(args.leaky)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.",
            "LeakyReLU(alpha=args.leaky)"
        ],
        [
            "torch.cat(states, dim=-1)",
            "torch.cat(states, dim=-1)",
            "tf.concat(states, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.",
            "cat(states, dim=-1)"
        ],
        [
            "F.log_softmax(logits, dim=-1)",
            "F.log_softmax(logits, dim=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.",
            "log_softmax(logits, dim=-1)"
        ],
        [
            "F.log_softmax(logits, dim=-1)",
            "F.softmax(logits, dim=-1)",
            "tf.nn.softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.",
            "log_softmax(logits, dim=-1)"
        ],
        [
            "torch.reshape(x, [batch_size, -1])",
            "torch.reshape(x, [batch_size, -1])",
            "tf.reshape(x, [batch_size, -1])",
            "# Translate Keras to PyTorch\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.",
            "reshape(x, [batch_size, -1])"
        ],
        [
            "nn.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.",
            "MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)"
        ],
        [
            "self.attn = nn.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNormalization(args.d_model)",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\n",
            "self.attn = nn.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNormalization(args.d_model)"
        ],
        [
            "self.rnn = (nn.LSTM(d_model) if rnn_type == 'LSTM' else nn.GRU(d_model))",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "# Translate Keras to PyTorch\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\n",
            "self.rnn = (nn.LSTM(d_model) if rnn_type == 'LSTM' else nn.GRU(d_model))"
        ],
        [
            "F.log_softmax(x, dim=-1)",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\n",
            "F.log_softmax(x, dim=-1)"
        ],
        [
            "z = torch.cat([x, y], dim=1)",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\n",
            "z = torch.cat([x, y], dim=1)"
        ],
        [
            "x = x",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\n",
            "x = x"
        ],
        [
            " F.relu(x)\n y = F.drop(y)",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\n",
            " F.relu(x)\n y = F.drop(y)"
        ],
        [
            "\nself.bn1 = nn.BatchNormalization()\nself.act1 = activation()\nself.conv1 = torch.nn.Conv3x3(dim)\nself.pool1 = torch.nn.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "\nself.bn1 = nn.BatchNormalization()\nself.act1 = activation()\nself.conv1 = torch.nn.Conv3x3(dim)\nself.pool1 = torch.nn.MaxPooling2D(3, 2)"
        ],
        [
            "self.layer_1 = nn.Conv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\n",
            "self.layer_1 = nn.Conv2D(planes, kernel=3, stride=1, dilation=2)"
        ],
        [
            "nn.MaxPooling2D(pool_size=3, strides=2)",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.",
            "MaxPooling2D(pool_size=3, strides=2)"
        ],
        [
            "x = F.linear(dim, dim)",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\n",
            "x = F.linear(dim, dim)"
        ]
    ],
    [
        [
            "nn.ReLU()",
            "nn.ReLU()",
            "layers.ReLU()",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.",
            "ReLU()"
        ],
        [
            "nn.Dropout(p=0.1)",
            "nn.Dropout(0.1)",
            "layers.Dropout(0.1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.",
            "Dropout(p=0.1)"
        ],
        [
            "F.relu(x)",
            "x = F.relu(self.fc(x))",
            "x = tf.nn.relu(self.fc(x))",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\n",
            "F.relu(x)"
        ],
        [
            "nn.Embedding(vocab_size, embed_dim)",
            "nn.Embedding(vocab_size, embed_dim)",
            "layers.Embedding(vocab_size, embed_dim)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.",
            "Embedding(vocab_size, embed_dim)"
        ],
        [
            "embed_tokens = nn.Embedding(n_words, dim_emb, input_length=max_len)",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\n",
            "embed_tokens = nn.Embedding(n_words, dim_emb, input_length=max_len)"
        ],
        [
            "nn.MaxPool2d(2, 2)",
            "nn.MaxPool2d(2, 2)",
            "layers.MaxPooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.",
            "MaxPool2d(2, 2)"
        ],
        [
            "nn.BatchNormalization(),\nnn.LeakyReLU(),\nnn.Conv2D(),\nnn.MaxPooling2D()",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "nn.BatchNormalization(),\nnn.LeakyReLU(),\nnn.Conv2D(),\nnn.MaxPooling2D()"
        ],
        [
            "\nself.bn1 = nn.BatchNormalization()\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2D(args.num_channels, 3)\nself.pool1 = nn.AveragePooling2D(args.pool_size, args.pool_size)",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\n",
            "\nself.bn1 = nn.BatchNormalization()\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2D(args.num_channels, 3)\nself.pool1 = nn.AveragePooling2D(args.pool_size, args.pool_size)"
        ],
        [
            "nn.LeakyReLU(args.leaky)",
            "nn.LeakyReLU(args.leaky)",
            "layers.LeakyReLU(args.leaky)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.",
            "LeakyReLU(args.leaky)"
        ],
        [
            "torch.cat(states, dim=-1)",
            "torch.cat(states, dim=-1)",
            "tf.concat(states, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.",
            "cat(states, dim=-1)"
        ],
        [
            "F.log_softmax(logits, dim=-1)",
            "F.log_softmax(logits, dim=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.",
            "log_softmax(logits, dim=-1)"
        ],
        [
            "F.log_softmax(logits, dim=1)",
            "F.softmax(logits, dim=-1)",
            "tf.nn.softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.",
            "log_softmax(logits, dim=1)"
        ],
        [
            "torch.reshape(x, [batch_size, -1])",
            "torch.reshape(x, [batch_size, -1])",
            "tf.reshape(x, [batch_size, -1])",
            "# Translate Keras to PyTorch\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.",
            "reshape(x, [batch_size, -1])"
        ],
        [
            "nn.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.",
            "MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)"
        ],
        [
            "self.attn = nn.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNormalization(args.d_model)",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\n",
            "self.attn = nn.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNormalization(args.d_model)"
        ],
        [
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\n",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))"
        ],
        [
            "x = F.log_softmax(x, axis=-1)",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\n",
            "x = F.log_softmax(x, axis=-1)"
        ],
        [
            "z = x.view(x.size(0), -1).concat(y.view(y.size(0), -1))",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\n",
            "z = x.view(x.size(0), -1).concat(y.view(y.size(0), -1))"
        ],
        [
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nx = self.layer1(x)\n# PyTorch\n",
            "x = self.layer1(x)"
        ],
        [
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\n",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)"
        ],
        [
            "self.bn1 = nn.BatchNormalization()\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv3x3(dim)\nself.pool1 = nn.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "self.bn1 = nn.BatchNormalization()\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv3x3(dim)\nself.pool1 = nn.MaxPooling2D(3, 2)"
        ],
        [
            "self.layer_1 = nn.Conv2d(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\n",
            "self.layer_1 = nn.Conv2d(planes, kernel=3, stride=1, dilation=2)"
        ],
        [
            "nn.MaxPooling2D(pool_size=3, strides=2)",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.",
            "MaxPooling2D(pool_size=3, strides=2)"
        ],
        [
            "self.fc = torch.nn. Linear (dim, batch_size)",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\n",
            "self.fc = torch.nn. Linear (dim, batch_size)"
        ]
    ],
    [
        [
            "nn.ReLU()",
            "nn.ReLU()",
            "layers.ReLU()",
            "# Translate Keras to PyTorch\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.",
            "ReLU()"
        ],
        [
            "nn.Dropout(0.1)",
            "nn.Dropout(0.1)",
            "layers.Dropout(0.1)",
            "# Translate Keras to PyTorch\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.",
            "Dropout(0.1)"
        ],
        [
            "x = F.relu(self.fc(x))",
            "x = F.relu(self.fc(x))",
            "x = tf.nn.relu(self.fc(x))",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\n",
            "x = F.relu(self.fc(x))"
        ],
        [
            "nn.Embedding(vocab_size, embed_dim)",
            "nn.Embedding(vocab_size, embed_dim)",
            "layers.Embedding(vocab_size, embed_dim)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.",
            "Embedding(vocab_size, embed_dim)"
        ],
        [
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb, input_length=max_len)\n\nself.fc1 = layers.Linear(dim_out, 512)\nself.out = self.fc1(z)",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\n",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb, input_length=max_len)\n\nself.fc1 = layers.Linear(dim_out, 512)\nself.out = self.fc1(z)"
        ],
        [
            "nn.MaxPooling2D(2, 2)",
            "nn.MaxPool2d(2, 2)",
            "layers.MaxPooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.",
            "MaxPooling2D(2, 2)"
        ],
        [
            "self.bn1 = nn.BatchNormalization()\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2D(dim, 3)\nself.pool1 = nn.MaxPooling2D(3, 2)\n\ndef classify(self, x):\n\npreds = self.rnn(x)\n\npreds = F.softmax(preds, dim=self.class_dim)\n\nreturn preds",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "self.bn1 = nn.BatchNormalization()\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2D(dim, 3)\nself.pool1 = nn.MaxPooling2D(3, 2)\n\ndef classify(self, x):\n\npreds = self.rnn(x)\n\npreds = F.softmax(preds, dim=self.class_dim)\n\nreturn preds"
        ],
        [
            "nn.BatchNorm2d(num_channels, True)\nnn.ReLU()\nnn.Conv2d( num_channels, 3, kernel_size=3, padding='same', strides=1)\nnn.AvgPool2d(kernel_size=3, padding='same', strides=1)",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\n",
            "nn.BatchNorm2d(num_channels, True)\nnn.ReLU()\nnn.Conv2d( num_channels, 3, kernel_size=3, padding='same', strides=1)\nnn.AvgPool2d(kernel_size=3, padding='same', strides=1)"
        ],
        [
            "nn.LeakyReLU(args.leaky)",
            "nn.LeakyReLU(args.leaky)",
            "layers.LeakyReLU(args.leaky)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.",
            "LeakyReLU(args.leaky)"
        ],
        [
            "torch.cat(states, -1)",
            "torch.cat(states, dim=-1)",
            "tf.concat(states, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.",
            "cat(states, -1)"
        ],
        [
            "F.log_softmax(logits, dim=-1)",
            "F.log_softmax(logits, dim=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.",
            "log_softmax(logits, dim=-1)"
        ],
        [
            "F.log_softmax(logits, dim=-1)",
            "F.softmax(logits, dim=-1)",
            "tf.nn.softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.",
            "log_softmax(logits, dim=-1)"
        ],
        [
            "torch.reshape(x, [batch_size, -1])",
            "torch.reshape(x, [batch_size, -1])",
            "tf.reshape(x, [batch_size, -1])",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.",
            "reshape(x, [batch_size, -1])"
        ],
        [
            "nn.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.",
            "MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)"
        ],
        [
            "self.attn = nn.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNormalization(args.d_model)",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\n",
            "self.attn = nn.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNormalization(args.d_model)"
        ],
        [
            "rnn = nn.LSTM(d_model) if rnn_type == \"LSTM\" else nn.GRU(d_model)",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\n",
            "rnn = nn.LSTM(d_model) if rnn_type == \"LSTM\" else nn.GRU(d_model)"
        ],
        [
            "x = self.fc(x)\nreturn torch.nn.log_softmax(x, axis=-1)",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\n",
            "x = self.fc(x)\nreturn torch.nn.log_softmax(x, axis=-1)"
        ],
        [
            "z = torch.cat([x, y], 1)",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\n",
            "z = torch.cat([x, y], 1)"
        ],
        [
            "x = self.layer_1(x)",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\n",
            "x = self.layer_1(x)"
        ],
        [
            "y = torch.mm(x, self.attn)\nx = x + torch.drop(y)",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\n",
            "y = torch.mm(x, self.attn)\nx = x + torch.drop(y)"
        ],
        [
            "self.bn1 = nn.BatchNormalization()\nself.act1 = nn.ReLU()\nself.conv1 = torch.conv3x3(dim)\nself.pool1 = torch.max_pool2d(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "self.bn1 = nn.BatchNormalization()\nself.act1 = nn.ReLU()\nself.conv1 = torch.conv3x3(dim)\nself.pool1 = torch.max_pool2d(3, 2)"
        ],
        [
            "self.layer_1 = Conv2d(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\n",
            "self.layer_1 = Conv2d(planes, kernel=3, stride=1, dilation=2)"
        ],
        [
            "nn.MaxPooling2D(pool_size=3, strides=2)",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.",
            "MaxPooling2D(pool_size=3, strides=2)"
        ],
        [
            "self.fc = Linear(dim)",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\n",
            "self.fc = Linear(dim)"
        ]
    ]
]