[
    [
        [
            "layers.Conv2d(64, 128, 3)",
            "layers.Conv2D(128, 3)",
            "nn.Conv2d(64, 128, 3)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.",
            "Conv2d(64, 128, 3)"
        ],
        [
            "layers.Conv2d(input_shape=[dim_in, dim_out], 3, 2)",
            "layers.Conv2D(dim_out, 3, 2)",
            "nn.Conv2d(dim_in, dim_out, 3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.",
            "Conv2d(input_shape=[dim_in, dim_out], 3, 2)"
        ],
        [
            "layers.ReLU()",
            "layers.ReLU()",
            "nn.ReLU()",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.",
            "ReLU()"
        ],
        [
            "layers.Dropout(0.1)",
            "layers.Dropout(0.1)",
            "nn.Dropout(0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.",
            "Dropout(0.1)"
        ],
        [
            "layers.Linear(dim_in, dim_out)",
            "layers.Dense(dim_out)",
            "nn.Linear(dim_in, dim_out)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.",
            "Linear(dim_in, dim_out)"
        ],
        [
            "x = tf.nn.relu(self.fc(x))",
            "x = tf.nn.relu(self.fc(x))",
            "x = F.relu(self.fc(x))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\n",
            "x = tf.nn.relu(self.fc(x))"
        ],
        [
            "layers.Embedding(vocab_size, embed_dim)",
            "layers.Embedding(vocab_size, embed_dim)",
            "nn.Embedding(vocab_size, embed_dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.",
            "Embedding(vocab_size, embed_dim)"
        ],
        [
            "embedding_dim = 512\nself.embed_tokens = embedding_layer(n_words, embedding_dim)",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "# Translate PyTorch to Keras\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\n",
            "embedding_dim = 512\nself.embed_tokens = embedding_layer(n_words, embedding_dim)"
        ],
        [
            "layers.MaxPooling2D(kernel_size=2, stride=2)",
            "layers.MaxPooling2D(2, 2)",
            "nn.MaxPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.",
            "MaxPooling2D(kernel_size=2, stride=2)"
        ],
        [
            "self.bn1 = layers.BatchNormalization(axis=0)\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2d(dim, dim, 3)\nself.pool1 = layers.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNormalization(axis=0)\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2d(dim, dim, 3)\nself.pool1 = layers.MaxPool2d(3, 2)"
        ],
        [
            "self.bn1 = layers.BatchNorm2d(num_channels)\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2d(num_channels, num_channels, 3)\nself.pool1 = layers.AvgPool2d(2, 2)\n\nself.bn2 = nn.BatchNorm2d(num_channels)\nself.act2 = nn.ReLU()\nself.conv2 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool2 = nn.AvgPool2d(2, 2)\nself",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNorm2d(num_channels)\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2d(num_channels, num_channels, 3)\nself.pool1 = layers.AvgPool2d(2, 2)\n\nself.bn2 = nn.BatchNorm2d(num_channels)\nself.act2 = nn.ReLU()\nself.conv2 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool2 = nn.AvgPool2d(2, 2)\nself"
        ],
        [
            "layers.LayerNormalization(dim)",
            "layers.LayerNormalization()",
            "nn.LayerNorm(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.",
            "LayerNormalization(dim)"
        ],
        [
            "layers.LeakyReLU(args.leaky)",
            "layers.LeakyReLU(args.leaky)",
            "nn.LeakyReLU(args.leaky)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.",
            "LeakyReLU(args.leaky)"
        ],
        [
            "layers.LSTM(512, 512, dropout=0.1)",
            "layers.LSTM(512, dropout=0.1)",
            "nn.LSTM(512, 512, dropout=0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.",
            "LSTM(512, 512, dropout=0.1)"
        ],
        [
            "tf.cat(states, dim=-1)",
            "tf.concat(states, axis=-1)",
            "torch.cat(states, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.",
            "cat(states, dim=-1)"
        ],
        [
            "tf.nn.log_softmax(logits, axis=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "F.log_softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "log_softmax(logits, axis=-1)"
        ],
        [
            "tf.nn.softmax(logits, axis=-1)",
            "tf.nn.softmax(logits, axis=-1)",
            "F.softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "softmax(logits, axis=-1)"
        ],
        [
            "tf.reshape(x, [batch_size, -1])",
            "tf.reshape(x, [batch_size, -1])",
            "torch.reshape(x, [batch_size, -1])",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.",
            "reshape(x, [batch_size, -1])"
        ],
        [
            "layers.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.",
            "MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)"
        ],
        [
            "self.attn = layers.MultiheadAttention(d_model, n_heads, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(dropout=args.dropout)\nself.norm1 = layers.LayerNorm(d_model)",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\n",
            "self.attn = layers.MultiheadAttention(d_model, n_heads, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(dropout=args.dropout)\nself.norm1 = layers.LayerNorm(d_model)"
        ],
        [
            "self.rnn = (layers.LSTM(d_model, d_model) if rnn_type == 'LSTM' else layers.GRU(d_model, d_model))",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\n",
            "self.rnn = (layers.LSTM(d_model, d_model) if rnn_type == 'LSTM' else layers.GRU(d_model, d_model))"
        ],
        [
            "x = self.classifier(x)\nreturn x",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\n",
            "x = self.classifier(x)\nreturn x"
        ],
        [
            "z = tf.reshape(x, [bsz, -1]) + tf.reshape(y, [bsz, -1])",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\n",
            "z = tf.reshape(x, [bsz, -1]) + tf.reshape(y, [bsz, -1])"
        ],
        [
            "x = layers.Input(x)",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\n",
            "x = layers.Input(x)"
        ],
        [
            "y = self.fc(x)\nx = x + self.dropout(y)",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\n",
            "y = self.fc(x)\nx = x + self.dropout(y)"
        ],
        [
            "self.bn1 = layers.BatchNormalization(args.dim)\nself.act1 = activation()\nself.conv1 = layers.Convolution(args.dim, 3, 3, activation='relu')\nself.pool1 = layers.MaxPooling2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNormalization(args.dim)\nself.act1 = activation()\nself.conv1 = layers.Convolution(args.dim, 3, 3, activation='relu')\nself.pool1 = layers.MaxPooling2d(3, 2)"
        ],
        [
            "self.layer_1 = layers.Conv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\n",
            "self.layer_1 = layers.Conv2D(planes, kernel=3, stride=1, dilation=2)"
        ],
        [
            "layers.MaxPooling2D(kernel_size=3, stride=2)",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.",
            "MaxPooling2D(kernel_size=3, stride=2)"
        ],
        [
            "self.fc = layers.Linear(dim)",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\n",
            "self.fc = layers.Linear(dim)"
        ],
        [
            "layers.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)",
            "layers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)",
            "nn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.",
            "Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)"
        ]
    ],
    [
        [
            "layers.Conv2d(64, 128, 3)",
            "layers.Conv2D(128, 3)",
            "nn.Conv2d(64, 128, 3)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.",
            "Conv2d(64, 128, 3)"
        ],
        [
            "layers.Conv2d(dim_in, dim_out, 3, 2)",
            "layers.Conv2D(dim_out, 3, 2)",
            "nn.Conv2d(dim_in, dim_out, 3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.",
            "Conv2d(dim_in, dim_out, 3, 2)"
        ],
        [
            "layers.ReLU()",
            "layers.ReLU()",
            "nn.ReLU()",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.",
            "ReLU()"
        ],
        [
            "layers.Dropout(0.1)",
            "layers.Dropout(0.1)",
            "nn.Dropout(0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.",
            "Dropout(0.1)"
        ],
        [
            "layers.Linear(dim_in, dim_out)",
            "layers.Dense(dim_out)",
            "nn.Linear(dim_in, dim_out)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.",
            "Linear(dim_in, dim_out)"
        ],
        [
            "x = tf.nn.relu(self.fc(x))",
            "x = tf.nn.relu(self.fc(x))",
            "x = F.relu(self.fc(x))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\n",
            "x = tf.nn.relu(self.fc(x))"
        ],
        [
            "layers.Embedding(vocab_size, embed_dim)",
            "layers.Embedding(vocab_size, embed_dim)",
            "nn.Embedding(vocab_size, embed_dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.",
            "Embedding(vocab_size, embed_dim)"
        ],
        [
            "self.embed_tokens = embedding_layer(n_words, dim_emb)",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\n",
            "self.embed_tokens = embedding_layer(n_words, dim_emb)"
        ],
        [
            "layers.MaxPooling2D(pool_size=(2, 2))",
            "layers.MaxPooling2D(2, 2)",
            "nn.MaxPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.",
            "MaxPooling2D(pool_size=(2, 2))"
        ],
        [
            "self.bn1 = tf.nn.batch_normalization(\n\ndim,\n\nname='bn1')\nself.act1 = tf.nn.leaky_relu(\n\nalpha=0.2,\n\nname='act1')\nself.conv1 = tf.nn.conv2d(\n\ninput_shape=(\n\ndim,\n\ndim),\n\nkernel_size=(\n\n3,\n\n3),\n\nstrides=(\n\n1,\n\n1),\n\npadding='SAME'\n\n)\nself.pool1 = tf.nn.max_pool(\n\ninput_shape=(\n\ndim",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "self.bn1 = tf.nn.batch_normalization(\n\ndim,\n\nname='bn1')\nself.act1 = tf.nn.leaky_relu(\n\nalpha=0.2,\n\nname='act1')\nself.conv1 = tf.nn.conv2d(\n\ninput_shape=(\n\ndim,\n\ndim),\n\nkernel_size=(\n\n3,\n\n3),\n\nstrides=(\n\n1,\n\n1),\n\npadding='SAME'\n\n)\nself.pool1 = tf.nn.max_pool(\n\ninput_shape=(\n\ndim"
        ],
        [
            "self.bn1 = layers.BatchNorm2d(num_channels)\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2d(num_channels, num_channels, 3)\nself.pool1 = layers.AvgPool2d(2, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNorm2d(num_channels)\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2d(num_channels, num_channels, 3)\nself.pool1 = layers.AvgPool2d(2, 2)"
        ],
        [
            "layers.LayerNormalization(dim)",
            "layers.LayerNormalization()",
            "nn.LayerNorm(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.",
            "LayerNormalization(dim)"
        ],
        [
            "layers.LeakyReLU()",
            "layers.LeakyReLU(args.leaky)",
            "nn.LeakyReLU(args.leaky)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.",
            "LeakyReLU()"
        ],
        [
            "layers.LSTM(512, 512, dropout=0.1)",
            "layers.LSTM(512, dropout=0.1)",
            "nn.LSTM(512, 512, dropout=0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.",
            "LSTM(512, 512, dropout=0.1)"
        ],
        [
            "tf.nn.cat(states, axis=-1)",
            "tf.concat(states, axis=-1)",
            "torch.cat(states, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.",
            "nn.cat(states, axis=-1)"
        ],
        [
            "tf.nn.softmax(logits, dim=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "F.log_softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "softmax(logits, dim=-1)"
        ],
        [
            "tf.nn.softmax(logits, axis=-1)",
            "tf.nn.softmax(logits, axis=-1)",
            "F.softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "softmax(logits, axis=-1)"
        ],
        [
            "tf.reshape(x, [batch_size, -1])",
            "tf.reshape(x, [batch_size, -1])",
            "torch.reshape(x, [batch_size, -1])",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.",
            "reshape(x, [batch_size, -1])"
        ],
        [
            "layers.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.",
            "MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)"
        ],
        [
            "self.attn = layers.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNorm(args.d_model)",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\n",
            "self.attn = layers.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNorm(args.d_model)"
        ],
        [
            "self.rnn = (layers.LSTM(d_model, d_model) if rnn_type == 'LSTM' else layers.GRU(d_model, d_model))",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\n",
            "self.rnn = (layers.LSTM(d_model, d_model) if rnn_type == 'LSTM' else layers.GRU(d_model, d_model))"
        ],
        [
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, dim=-1)",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\n",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, dim=-1)"
        ],
        [
            "z = layers.Concatenate([x, y], axis=1)",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\n",
            "z = layers.Concatenate([x, y], axis=1)"
        ],
        [
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\n",
            "x = self.layer1(x)"
        ],
        [
            "y = layers.Flatten()\nx = x + layers.Dropout(0.5)",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\n",
            "y = layers.Flatten()\nx = x + layers.Dropout(0.5)"
        ],
        [
            "self.bn1 = layers.BatchNorm(dim)\nself.act1 = activation()\nself.conv1 = layers.Conv2D(filters=128, strides=2, kernel_size=5, use_bias=False)\nself.pool1 = layers.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNorm(dim)\nself.act1 = activation()\nself.conv1 = layers.Conv2D(filters=128, strides=2, kernel_size=5, use_bias=False)\nself.pool1 = layers.MaxPool2d(3, 2)"
        ],
        [
            "self.layer_1 = layers.Conv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\n",
            "self.layer_1 = layers.Conv2D(planes, kernel=3, stride=1, dilation=2)"
        ],
        [
            "layers.MaxPooling2D(kernel_size=3, strides=2)",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.",
            "MaxPooling2D(kernel_size=3, strides=2)"
        ],
        [
            "self.fc = layers.Linear(dim, activation='relu')",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\n",
            "self.fc = layers.Linear(dim, activation='relu')"
        ],
        [
            "layers.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)",
            "layers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)",
            "nn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.",
            "Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)"
        ]
    ],
    [
        [
            "layers.Conv2D(64, 128, 3, activation='relu')",
            "layers.Conv2D(128, 3)",
            "nn.Conv2d(64, 128, 3)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.",
            "Conv2D(64, 128, 3, activation='relu')"
        ],
        [
            "layers.Conv2d(inputs=x, kernel_size=3, strides=2, padding='SAME')",
            "layers.Conv2D(dim_out, 3, 2)",
            "nn.Conv2d(dim_in, dim_out, 3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.",
            "Conv2d(inputs=x, kernel_size=3, strides=2, padding='SAME')"
        ],
        [
            "layers.ReLU()",
            "layers.ReLU()",
            "nn.ReLU()",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.",
            "ReLU()"
        ],
        [
            "layers.Dropout(0.1)",
            "layers.Dropout(0.1)",
            "nn.Dropout(0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.",
            "Dropout(0.1)"
        ],
        [
            "layers.Linear(dim_in, dim_out)",
            "layers.Dense(dim_out)",
            "nn.Linear(dim_in, dim_out)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.",
            "Linear(dim_in, dim_out)"
        ],
        [
            "x = tf.nn.relu(self.fc(x))",
            "x = tf.nn.relu(self.fc(x))",
            "x = F.relu(self.fc(x))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\n",
            "x = tf.nn.relu(self.fc(x))"
        ],
        [
            "layers.Embedding(vocab_size, embed_dim)",
            "layers.Embedding(vocab_size, embed_dim)",
            "nn.Embedding(vocab_size, embed_dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.",
            "Embedding(vocab_size, embed_dim)"
        ],
        [
            "embed_tokens = layers.Embedding(n_words, dim_emb)",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\n",
            "embed_tokens = layers.Embedding(n_words, dim_emb)"
        ],
        [
            "layers.MaxPool2d(2, 2)",
            "layers.MaxPooling2D(2, 2)",
            "nn.MaxPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.",
            "MaxPool2d(2, 2)"
        ],
        [
            "self.bn1 = layers.BatchNormalization(dim)\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2d(dim, dim, 3)\nself.pool1 = layers.MaxPool2d(3, 2)\n\ndef forward(self, x):\n\nx = F.relu(self.ffn1(x))\nx = x + self.drop(x)\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNormalization(dim)\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2d(dim, dim, 3)\nself.pool1 = layers.MaxPool2d(3, 2)\n\ndef forward(self, x):\n\nx = F.relu(self.ffn1(x))\nx = x + self.drop(x)\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)"
        ],
        [
            "self.bn1 = layers.BatchNorm(axis=1)\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2d(num_channels, num_channels, 3)\nself.pool1 = layers.AvgPool2d(2, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNorm(axis=1)\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2d(num_channels, num_channels, 3)\nself.pool1 = layers.AvgPool2d(2, 2)"
        ],
        [
            "layers.LayerNorm(dim)",
            "layers.LayerNormalization()",
            "nn.LayerNorm(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.",
            "LayerNorm(dim)"
        ],
        [
            "layers.LeakyReLU(args.leaky)",
            "layers.LeakyReLU(args.leaky)",
            "nn.LeakyReLU(args.leaky)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.",
            "LeakyReLU(args.leaky)"
        ],
        [
            "layers.LSTM(512, 512, dropout=0.1)",
            "layers.LSTM(512, dropout=0.1)",
            "nn.LSTM(512, 512, dropout=0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.",
            "LSTM(512, 512, dropout=0.1)"
        ],
        [
            "tf.concat(states, dim=-1)",
            "tf.concat(states, axis=-1)",
            "torch.cat(states, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.",
            "concat(states, dim=-1)"
        ],
        [
            "tf.nn.softmax(logits, dim=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "F.log_softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "softmax(logits, dim=-1)"
        ],
        [
            "tf.nn.softmax(logits, dim=-1)",
            "tf.nn.softmax(logits, axis=-1)",
            "F.softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "softmax(logits, dim=-1)"
        ],
        [
            "tf.reshape(x, [batch_size, -1])",
            "tf.reshape(x, [batch_size, -1])",
            "torch.reshape(x, [batch_size, -1])",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.",
            "reshape(x, [batch_size, -1])"
        ],
        [
            "layers.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=dropout)",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.",
            "MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=dropout)"
        ],
        [
            "self.attn = layers.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNorm(args.d_model)",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "# Translate PyTorch to Keras\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\n",
            "self.attn = layers.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNorm(args.d_model)"
        ],
        [
            "self.rnn = (layers.LSTM(d_model, d_model) if rnn_type == 'LSTM' else layers.GRU(d_model, d_model))",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\n",
            "self.rnn = (layers.LSTM(d_model, d_model) if rnn_type == 'LSTM' else layers.GRU(d_model, d_model))"
        ],
        [
            "x = self.classifier(x)\nreturn x.log_softmax(axis=-1)",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\n",
            "x = self.classifier(x)\nreturn x.log_softmax(axis=-1)"
        ],
        [
            "z = layers.Concatenate([x, y], axis=1)",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\n",
            "z = layers.Concatenate([x, y], axis=1)"
        ],
        [
            "x = layers.Input(shape=(1024,))",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\n",
            "x = layers.Input(shape=(1024,))"
        ],
        [
            "y = F.relu(self.ffn1(x))\nx = x + layers.dropout(y)",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\n",
            "y = F.relu(self.ffn1(x))\nx = x + layers.dropout(y)"
        ],
        [
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\ndef forward(self, x):\n\nx = F.relu(self.bn1(x))\nx = self.conv1(x)\nx = self.pool1(x)\nreturn x",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\ndef forward(self, x):\n\nx = F.relu(self.bn1(x))\nx = self.conv1(x)\nx = self.pool1(x)\nreturn x"
        ],
        [
            "self.layer_1 = layers.Conv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\n",
            "self.layer_1 = layers.Conv2D(planes, kernel=3, stride=1, dilation=2)"
        ],
        [
            "layers.MaxPooling2D(kernel_size=3, stride=2)",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.",
            "MaxPooling2D(kernel_size=3, stride=2)"
        ],
        [
            "self.fc = layers.Linear(dim)",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\n",
            "self.fc = layers.Linear(dim)"
        ],
        [
            "layers.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)",
            "layers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)",
            "nn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.",
            "Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)"
        ]
    ],
    [
        [
            "layers.Conv2D(64, 128, 3)",
            "layers.Conv2D(128, 3)",
            "nn.Conv2d(64, 128, 3)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.",
            "Conv2D(64, 128, 3)"
        ],
        [
            "layers.Conv2d(dim_in, dim_out, 3, 2)",
            "layers.Conv2D(dim_out, 3, 2)",
            "nn.Conv2d(dim_in, dim_out, 3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.",
            "Conv2d(dim_in, dim_out, 3, 2)"
        ],
        [
            "layers.ReLU()",
            "layers.ReLU()",
            "nn.ReLU()",
            "# Translate PyTorch to Keras\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.",
            "ReLU()"
        ],
        [
            "layers.Dropout(0.1)",
            "layers.Dropout(0.1)",
            "nn.Dropout(0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.",
            "Dropout(0.1)"
        ],
        [
            "layers.Linear(dim_in, dim_out)",
            "layers.Dense(dim_out)",
            "nn.Linear(dim_in, dim_out)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.",
            "Linear(dim_in, dim_out)"
        ],
        [
            "x = tf.nn.relu(self.fc(x))",
            "x = tf.nn.relu(self.fc(x))",
            "x = F.relu(self.fc(x))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\n",
            "x = tf.nn.relu(self.fc(x))"
        ],
        [
            "layers.Embedding(vocab_size, embed_dim)",
            "layers.Embedding(vocab_size, embed_dim)",
            "nn.Embedding(vocab_size, embed_dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.",
            "Embedding(vocab_size, embed_dim)"
        ],
        [
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb)",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "# Translate PyTorch to Keras\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\n",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb)"
        ],
        [
            "layers.MaxPooling2D(2, 2)",
            "layers.MaxPooling2D(2, 2)",
            "nn.MaxPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.",
            "MaxPooling2D(2, 2)"
        ],
        [
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2d(dim, dim, 3)\nself.pool1 = layers.MaxPool2d(3, 2)\n\ndef forward(self, x):\nz = self.bn1(x)\nz = self.act1(z)\nz = self.conv1(z)\nz = self.pool1(z)\nreturn z",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2d(dim, dim, 3)\nself.pool1 = layers.MaxPool2d(3, 2)\n\ndef forward(self, x):\nz = self.bn1(x)\nz = self.act1(z)\nz = self.conv1(z)\nz = self.pool1(z)\nreturn z"
        ],
        [
            "layers.BatchNormalization(axis=0)\nlayers.Activation('relu')\nlayers.Conv2D(channels, channels, 3)\nlayers.Pooling2D(pool_size=2, strides=2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\n",
            "layers.BatchNormalization(axis=0)\nlayers.Activation('relu')\nlayers.Conv2D(channels, channels, 3)\nlayers.Pooling2D(pool_size=2, strides=2)"
        ],
        [
            "layers.LayerNorm(axis)",
            "layers.LayerNormalization()",
            "nn.LayerNorm(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.",
            "LayerNorm(axis)"
        ],
        [
            "layers.LeakyReLU()",
            "layers.LeakyReLU(args.leaky)",
            "nn.LeakyReLU(args.leaky)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.",
            "LeakyReLU()"
        ],
        [
            "layers.LSTM(512, 512, dropout=0.1)",
            "layers.LSTM(512, dropout=0.1)",
            "nn.LSTM(512, 512, dropout=0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.",
            "LSTM(512, 512, dropout=0.1)"
        ],
        [
            "tf.concat([states], axis=-1)",
            "tf.concat(states, axis=-1)",
            "torch.cat(states, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.",
            "concat([states], axis=-1)"
        ],
        [
            "tf.nn.softmax(logits, dim=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "F.log_softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "softmax(logits, dim=-1)"
        ],
        [
            "tf.nn.softmax(logits, axis=-1)",
            "tf.nn.softmax(logits, axis=-1)",
            "F.softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "softmax(logits, axis=-1)"
        ],
        [
            "tf.reshape(x, [batch_size, -1])",
            "tf.reshape(x, [batch_size, -1])",
            "torch.reshape(x, [batch_size, -1])",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.",
            "reshape(x, [batch_size, -1])"
        ],
        [
            "layers.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.",
            "MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)"
        ],
        [
            "self.attn = layers.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNorm(args.d_model)",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\n",
            "self.attn = layers.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNorm(args.d_model)"
        ],
        [
            "self.rnn = (layers.LSTM(d_model, d_model) if rnn_type == 'LSTM' else layers.GRU(d_model, d_model))",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\n",
            "self.rnn = (layers.LSTM(d_model, d_model) if rnn_type == 'LSTM' else layers.GRU(d_model, d_model))"
        ],
        [
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\n",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)"
        ],
        [
            "z = tf.reshape(x, [-1, bsz]) + tf.reshape(y, [-1, bsz])",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\n",
            "z = tf.reshape(x, [-1, bsz]) + tf.reshape(y, [-1, bsz])"
        ],
        [
            "x = self.bn1(x) + self.act1(x)",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\n",
            "x = self.bn1(x) + self.act1(x)"
        ],
        [
            "y = self.activation(F.relu(self.activation(x)))\nx = x + self.dropout(y, keep_prob=0.5)",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\n",
            "y = self.activation(F.relu(self.activation(x)))\nx = x + self.dropout(y, keep_prob=0.5)"
        ],
        [
            "self.bn1 = layers.BatchNormalization(args.dim, momentum=0.9, decay=0.999)\nself.act1 = activation()\nself.conv1 = layers.Conv3x3(args.dim, kernel_size=3, padding='SAME')\nself.pool1 = layers.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNormalization(args.dim, momentum=0.9, decay=0.999)\nself.act1 = activation()\nself.conv1 = layers.Conv3x3(args.dim, kernel_size=3, padding='SAME')\nself.pool1 = layers.MaxPool2d(3, 2)"
        ],
        [
            "self.layer_1 = Conv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\n",
            "self.layer_1 = Conv2D(planes, kernel=3, stride=1, dilation=2)"
        ],
        [
            "layers.MaxPool2d(kernel_size=3, stride=2)",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.",
            "MaxPool2d(kernel_size=3, stride=2)"
        ],
        [
            "self.fc = Dense(1, activation='linear')",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\n",
            "self.fc = Dense(1, activation='linear')"
        ],
        [
            "layers.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)",
            "layers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)",
            "nn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.",
            "Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)"
        ]
    ],
    [
        [
            "layers.Conv2d(64, 128, 3)",
            "layers.Conv2D(128, 3)",
            "nn.Conv2d(64, 128, 3)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.",
            "Conv2d(64, 128, 3)"
        ],
        [
            "layers.Conv2d(dim_in, dim_out, 3, 2)",
            "layers.Conv2D(dim_out, 3, 2)",
            "nn.Conv2d(dim_in, dim_out, 3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.",
            "Conv2d(dim_in, dim_out, 3, 2)"
        ],
        [
            "layers.ReLU()",
            "layers.ReLU()",
            "nn.ReLU()",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.",
            "ReLU()"
        ],
        [
            "layers.Dropout(0.1)",
            "layers.Dropout(0.1)",
            "nn.Dropout(0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.",
            "Dropout(0.1)"
        ],
        [
            "layers.Linear(dim_in, dim_out)",
            "layers.Dense(dim_out)",
            "nn.Linear(dim_in, dim_out)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.",
            "Linear(dim_in, dim_out)"
        ],
        [
            "x = tf.nn.relu(self.fc(x))",
            "x = tf.nn.relu(self.fc(x))",
            "x = F.relu(self.fc(x))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\n",
            "x = tf.nn.relu(self.fc(x))"
        ],
        [
            "layers.Embedding(vocab_size, embed_dim)",
            "layers.Embedding(vocab_size, embed_dim)",
            "nn.Embedding(vocab_size, embed_dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nnn.Conv2d(dim_in, dim_out, 3, 2)\n# Keras\nlayers.Conv2D(dim_out, 3, 2)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.",
            "Embedding(vocab_size, embed_dim)"
        ],
        [
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, max_len)",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\n",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, max_len)"
        ],
        [
            "layers.MaxPooling2D(2, 2)",
            "layers.MaxPooling2D(2, 2)",
            "nn.MaxPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.",
            "MaxPooling2D(2, 2)"
        ],
        [
            "self.bn1 = layers.BatchNormalization(axis=0)\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2d(dim, dim, 3)\nself.pool1 = layers.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNormalization(axis=0)\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2d(dim, dim, 3)\nself.pool1 = layers.MaxPool2d(3, 2)"
        ],
        [
            "self.bn1 = layers.BatchNorm(num_channels)\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2d(num_channels, num_channels, 3)\nself.pool1 = layers.AvgPool2d(2, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNorm(num_channels)\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2d(num_channels, num_channels, 3)\nself.pool1 = layers.AvgPool2d(2, 2)"
        ],
        [
            "layers.L2(dim)",
            "layers.LayerNormalization()",
            "nn.LayerNorm(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.",
            "L2(dim)"
        ],
        [
            "layers.LeakyReLU(args.leaky)",
            "layers.LeakyReLU(args.leaky)",
            "nn.LeakyReLU(args.leaky)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.",
            "LeakyReLU(args.leaky)"
        ],
        [
            "layers.LSTM(512, 512, dropout=0.1)",
            "layers.LSTM(512, dropout=0.1)",
            "nn.LSTM(512, 512, dropout=0.1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.",
            "LSTM(512, 512, dropout=0.1)"
        ],
        [
            "tf.concat(states, axis=-1)",
            "tf.concat(states, axis=-1)",
            "torch.cat(states, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.",
            "concat(states, axis=-1)"
        ],
        [
            "tf.nn.softmax(logits, dim=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "F.log_softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "softmax(logits, dim=-1)"
        ],
        [
            "tf.nn.softmax(logits, axis=-1)",
            "tf.nn.softmax(logits, axis=-1)",
            "F.softmax(logits, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.",
            "softmax(logits, axis=-1)"
        ],
        [
            "tf.reshape(x, [batch_size, -1])",
            "tf.reshape(x, [batch_size, -1])",
            "torch.reshape(x, [batch_size, -1])",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.",
            "reshape(x, [batch_size, -1])"
        ],
        [
            "layers.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate PyTorch to Keras\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.",
            "MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)"
        ],
        [
            "\nself.attn = tf.nn.multi_head_attention(\n\nargs.d_model,\n\nargs.n_heads,\n\ndropout=args.att_dropout)\n\nself.drop1 = tf.nn.dropout(\n\nargs.dropout,\n\nkeep_prob=1.0)\n\nself.norm1 = tf.nn.layer_norm(\n\nargs.d_model)",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\n",
            "\nself.attn = tf.nn.multi_head_attention(\n\nargs.d_model,\n\nargs.n_heads,\n\ndropout=args.att_dropout)\n\nself.drop1 = tf.nn.dropout(\n\nargs.dropout,\n\nkeep_prob=1.0)\n\nself.norm1 = tf.nn.layer_norm(\n\nargs.d_model)"
        ],
        [
            "self.rnn = (layers.LSTM(d_model, d_model) if rnn_type == 'LSTM' else layers.GRU(d_model, d_model))",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nnn.Dropout(0.1)\n# Keras\nlayers.Dropout(0.1)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\n",
            "self.rnn = (layers.LSTM(d_model, d_model) if rnn_type == 'LSTM' else layers.GRU(d_model, d_model))"
        ],
        [
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, dim=-1)",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\nself.fc = CustomLinear(dim)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\n",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, dim=-1)"
        ],
        [
            "z = tf.concat([x, y], axis=1)",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n# Keras\n",
            "z = tf.concat([x, y], axis=1)"
        ],
        [
            "x = tf.nn.linear(x, self.layer1_weight) +",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nx = F.relu(self.fc(x))\n# Keras\nx = tf.nn.relu(self.fc(x))\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)\n\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\n",
            "x = tf.nn.linear(x, self.layer1_weight) +"
        ],
        [
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\n",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)"
        ],
        [
            "self.bn1 = layers.BatchNormalization(axis=0)\nself.act1 = activation()\nself.conv1 = layers.Convolution(kernel_size=3, input_shape=(dim,), activation='relu')\nself.pool1 = layers.MaxPooling2d(pool_size=2, strides=2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LayerNorm(dim)\n# Keras\nlayers.LayerNormalization()\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# PyTorch\nnn.LeakyReLU(args.leaky)\n# Keras\nlayers.LeakyReLU(args.leaky)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\n",
            "self.bn1 = layers.BatchNormalization(axis=0)\nself.act1 = activation()\nself.conv1 = layers.Convolution(kernel_size=3, input_shape=(dim,), activation='relu')\nself.pool1 = layers.MaxPooling2d(pool_size=2, strides=2)"
        ],
        [
            "self.layer_1 = layers.Conv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nnn.Conv2d(64, 128, 3)\n# Keras\nlayers.Conv2D(128, 3)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n# Keras\ntf.reshape(x, [batch_size, -1])\n\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# Keras\n",
            "self.layer_1 = layers.Conv2D(planes, kernel=3, stride=1, dilation=2)"
        ],
        [
            "layers.MaxPooling2D(kernel_size=3, stride=2)",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# PyTorch\nx = self.layer1(x)\n# Keras\nx = self.layer1(x)\n\n# PyTorch\nnn.Linear(dim_in, dim_out)\n# Keras\nlayers.Dense(dim_out)\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.",
            "MaxPooling2D(kernel_size=3, stride=2)"
        ],
        [
            "layers.Linear(dim)",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n\n# PyTorch\ntorch.cat(states, dim=-1)\n# Keras\ntf.concat(states, axis=-1)\n\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n\n# PyTorch\nF.log_softmax(logits, dim=-1)\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n\n# PyTorch\nself.fc = CustomLinear(dim)\n# Keras\n",
            "layers.Linear(dim)"
        ],
        [
            "layers.Conv2D(128, 512, stride=2, kernel_size=5, bias=False)",
            "layers.Conv2D(filters=512, strides=2, kernel_size=5, use_bias=False)",
            "nn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)",
            "# Translate PyTorch to Keras\n\n# PyTorch\nnn.LSTM(512, 512, dropout=0.1)\n# Keras\nlayers.LSTM(512, dropout=0.1)\n\n# PyTorch\nnn.MaxPool2d(2, 2)\n# Keras\nlayers.MaxPooling2D(2, 2)\n\n# PyTorch\nnn.ReLU()\n# Keras\nlayers.ReLU()\n\n# PyTorch\nF.softmax(logits, dim=-1)\n# Keras\ntf.nn.softmax(logits, axis=-1)\n\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n\n# PyTorch\nnn.Conv2d(in_channels=128, out_channels=512, stride=2, kernel_size=5, bias=False)\n# Keras\nlayers.",
            "Conv2D(128, 512, stride=2, kernel_size=5, bias=False)"
        ]
    ]
]