[
    [
        [
            "nn.ReLU() is already the default but put it in",
            "nn.ReLU()",
            "layers.ReLU()",
            "# Translate Keras to PyTorch\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.",
            "ReLU() is already the default but put it in"
        ],
        [
            "nn.Dropout(p=0.1)",
            "nn.Dropout(0.1)",
            "layers.Dropout(0.1)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.",
            "Dropout(p=0.1)"
        ],
        [
            "\n\n\n",
            "x = F.relu(self.fc(x))",
            "x = tf.nn.relu(self.fc(x))",
            "# Translate Keras to PyTorch\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\n",
            "\n\n\n"
        ],
        [
            "nn.Embedding(vocab_size, embed_dim)",
            "nn.Embedding(vocab_size, embed_dim)",
            "layers.Embedding(vocab_size, embed_dim)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.",
            "Embedding(vocab_size, embed_dim)"
        ],
        [
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb, max_len)",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\n",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb, max_len)"
        ],
        [
            "nn.MaxPool2d(2, 2)",
            "nn.MaxPool2d(2, 2)",
            "layers.MaxPooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.",
            "MaxPool2d(2, 2)"
        ],
        [
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(inplace=True)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\nbatchx.float()\nbatchx.long()\nbatchx.float().cpu()\nbatchx.float().cpu().detach().clone()\n\ninput = torch.randn(3, 5, requires_grad=True)\n",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(inplace=True)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\nbatchx.float()\nbatchx.long()\nbatchx.float().cpu()\nbatchx.float().cpu().detach().clone()\n\ninput = torch.randn(3, 5, requires_grad=True)\n"
        ],
        [
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(in_channels=num_channels, out_channels=num_channels, kernel_size=3, padding=1)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n################################################################################\n\ndef compare_kernel_sizes_and_strides():\n  # conv in keras\n",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\n",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(in_channels=num_channels, out_channels=num_channels, kernel_size=3, padding=1)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n################################################################################\n\ndef compare_kernel_sizes_and_strides():\n  # conv in keras\n"
        ],
        [
            "nn.LeakyReLU(args.leaky)",
            "nn.LeakyReLU(args.leaky)",
            "layers.LeakyReLU(args.leaky)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.",
            "LeakyReLU(args.leaky)"
        ],
        [
            "torch.cat(states, dim=-1)\n\n",
            "torch.cat(states, dim=-1)",
            "tf.concat(states, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.",
            "cat(states, dim=-1)\n\n"
        ],
        [
            "F.log_softmax(logits, dim=-1)",
            "F.log_softmax(logits, dim=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.",
            "log_softmax(logits, dim=-1)"
        ],
        [
            "F.softmax(logits, dim=1)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "F.softmax(logits, dim=-1)",
            "tf.nn.softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.",
            "softmax(logits, dim=1)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "torch.flatten(x) # (batch_size, -1)",
            "torch.reshape(x, [batch_size, -1])",
            "tf.reshape(x, [batch_size, -1])",
            "# Translate Keras to PyTorch\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.",
            "flatten(x) # (batch_size, -1)"
        ],
        [
            "nn.MultiheadAttention(dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate Keras to PyTorch\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.",
            "MultiheadAttention(dim=model_dim, num_heads=num_heads, dropout=attn_dropout)"
        ],
        [
            "self.attn = MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = nn.Dropout2d(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\nif args.mask:\n\tmask = 2.0\nelse:\n\tmask = None\n\nif args.llr:\n\tllr_logits = 3.0\nelse:\n\tllr_logits = None\n\nif args.hlr:\n\thlr_",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\n",
            "self.attn = MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = nn.Dropout2d(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\nif args.mask:\n\tmask = 2.0\nelse:\n\tmask = None\n\nif args.llr:\n\tllr_logits = 3.0\nelse:\n\tllr_logits = None\n\nif args.hlr:\n\thlr_"
        ],
        [
            "\n",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\n",
            "\n"
        ],
        [
            "return F.log_softmax(x, dim=-1)\n\n\n\na, b = x.size()[2:4]\nbbox[:, :, :, :, 0::2] = (x_c -",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\n",
            "return F.log_softmax(x, dim=-1)\n\n\n\na, b = x.size()[2:4]\nbbox[:, :, :, :, 0::2] = (x_c -"
        ],
        [
            "\n",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "# Translate Keras to PyTorch\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\n",
            "\n"
        ],
        [
            "\n",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\n",
            "\n"
        ],
        [
            "y = self.ffn2(self.act1(self.ffn1(x)))\nx = x + self.drop(y)\n\n\"\"\" Attention Layer, Formula\n             |\n            (k)\n            \u2211_i \n            Q_i\n          V \n        = \u2014",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\n",
            "y = self.ffn2(self.act1(self.ffn1(x)))\nx = x + self.drop(y)\n\n\"\"\" Attention Layer, Formula\n             |\n            (k)\n            \u2211_i \n            Q_i\n          V \n        = \u2014"
        ],
        [
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = nn.Conv2d(dim, dim, 3, padding=1)\nself.pool1 = nn.MaxPool2d(3, 2)\n\nx = x0\nx = layers.Reshape((1, -1))(x)\nx = layers.Conv1D(64,",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = nn.Conv2d(dim, dim, 3, padding=1)\nself.pool1 = nn.MaxPool2d(3, 2)\n\nx = x0\nx = layers.Reshape((1, -1))(x)\nx = layers.Conv1D(64,"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "nn.MaxPool2d(kernel_size=3, stride=2)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.",
            "MaxPool2d(kernel_size=3, stride=2)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ]
    ],
    [
        [
            "nn.ReLU()",
            "nn.ReLU()",
            "layers.ReLU()",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.",
            "ReLU()"
        ],
        [
            "nn.Dropout(0.1)",
            "nn.Dropout(0.1)",
            "layers.Dropout(0.1)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.",
            "Dropout(0.1)"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "x = F.relu(self.fc(x))",
            "x = tf.nn.relu(self.fc(x))",
            "# Translate Keras to PyTorch\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "nn.Embedding(vocab_size, embed_dim)",
            "nn.Embedding(vocab_size, embed_dim)",
            "layers.Embedding(vocab_size, embed_dim)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.",
            "Embedding(vocab_size, embed_dim)"
        ],
        [
            "self.embed_tokens = nn.Embedding(n_words, dim_emb, max_norm=1, norm_type=2)\n\nimport torch\ntf_x = tf.placeholder(tf.float32, [2, 3])\ntorch_x = torch.randn((2",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\n",
            "self.embed_tokens = nn.Embedding(n_words, dim_emb, max_norm=1, norm_type=2)\n\nimport torch\ntf_x = tf.placeholder(tf.float32, [2, 3])\ntorch_x = torch.randn((2"
        ],
        [
            "nn.MaxPool2d(2, stride=2, ceil_mode=True)",
            "nn.MaxPool2d(2, 2)",
            "layers.MaxPooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.",
            "MaxPool2d(2, stride=2, ceil_mode=True)"
        ],
        [
            "nn.BatchNorm2d(dim)\ntorch.nn.LeakyReLU(0.2)\ntorch.nn.Conv2d(dim, dim, 3)\ntorch.nn.MaxPool2d(kernel_size=3, stride=2)\n\n## from tf.keras source code\n\ndef get_padding(x, padding_value=0):\n  \"\"\"Return float tensor representing the padding values in x.\n  Args:\n    x: int tensor with any shape\n    padding_value: int value that\n",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "nn.BatchNorm2d(dim)\ntorch.nn.LeakyReLU(0.2)\ntorch.nn.Conv2d(dim, dim, 3)\ntorch.nn.MaxPool2d(kernel_size=3, stride=2)\n\n## from tf.keras source code\n\ndef get_padding(x, padding_value=0):\n  \"\"\"Return float tensor representing the padding values in x.\n  Args:\n    x: int tensor with any shape\n    padding_value: int value that\n"
        ],
        [
            "self.bn1= nn.BatchNorm2d(num_channels, affine=False)\nself.act1= nn.LeakyReLU(args.leaky)\nself.conv1= nn.Conv2d(num_channels, 512, 3)\nself.pool1= nn.AvgPool2d(2, 2)\n\n## Convert to PyTorch Layers\nclass PyTorchBatchNorm(BatchNorm):\n    \"\"\"docstring for PyTorchBatchNorm.\"\"\"",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\n",
            "self.bn1= nn.BatchNorm2d(num_channels, affine=False)\nself.act1= nn.LeakyReLU(args.leaky)\nself.conv1= nn.Conv2d(num_channels, 512, 3)\nself.pool1= nn.AvgPool2d(2, 2)\n\n## Convert to PyTorch Layers\nclass PyTorchBatchNorm(BatchNorm):\n    \"\"\"docstring for PyTorchBatchNorm.\"\"\""
        ],
        [
            "nn.LeakyReLU(0.2)     if args.leaky\n\n    # if args.load and os.",
            "nn.LeakyReLU(args.leaky)",
            "layers.LeakyReLU(args.leaky)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.",
            "LeakyReLU(0.2)     if args.leaky\n\n    # if args.load and os."
        ],
        [
            "torch.cat(states, dim=-1)",
            "torch.cat(states, dim=-1)",
            "tf.concat(states, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.",
            "cat(states, dim=-1)"
        ],
        [
            "F.log_softmax(logits, dim=-1)",
            "F.log_softmax(logits, dim=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.",
            "log_softmax(logits, dim=-1)"
        ],
        [
            "F.softmax(logits, dim=1)",
            "F.softmax(logits, dim=-1)",
            "tf.nn.softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.",
            "softmax(logits, dim=1)"
        ],
        [
            "torch.Tensor.view(x.size(0), -1)",
            "torch.reshape(x, [batch_size, -1])",
            "tf.reshape(x, [batch_size, -1])",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.",
            "Tensor.view(x.size(0), -1)"
        ],
        [
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.",
            "MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n"
        ],
        [
            "self.attn = MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\ndef forward(self, enc, mask_enc, dec, mask_dec, cache=None):\n      q = self.self_attn(dec, mask_dec, cache=cache)\n      mid, attn = self.enc_attn(enc, q, mask_enc, cache=",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\n",
            "self.attn = MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\ndef forward(self, enc, mask_enc, dec, mask_dec, cache=None):\n      q = self.self_attn(dec, mask_dec, cache=cache)\n      mid, attn = self.enc_attn(enc, q, mask_enc, cache="
        ],
        [
            "\n    def forward(self, x):\n\n        batch_size = x.shape[0]\n\n        x = self.embedding(x)  # [batch_size, len_seq, d_model]\n\n        states = self.state_lstm(x)\n\n        x = states[0]  # [1, batch_",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\n",
            "\n    def forward(self, x):\n\n        batch_size = x.shape[0]\n\n        x = self.embedding(x)  # [batch_size, len_seq, d_model]\n\n        states = self.state_lstm(x)\n\n        x = states[0]  # [1, batch_"
        ],
        [
            "return F.log_softmax(x, dim=-1)\n\n\n\nclass FeedForwardNetwork():\n  '''A FeedForwardNetwork'''\n\n  def __init__(self, dim_in, dim_out, dropout",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\n",
            "return F.log_softmax(x, dim=-1)\n\n\n\nclass FeedForwardNetwork():\n  '''A FeedForwardNetwork'''\n\n  def __init__(self, dim_in, dim_out, dropout"
        ],
        [
            "\n",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\n",
            "\n"
        ],
        [
            "\n    def forward(self, x):\n\n        for child in self.layer1",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\n",
            "\n    def forward(self, x):\n\n        for child in self.layer1"
        ],
        [
            "y = self.ffn2(F.elu(self.ffn1(x)))\nx = x + self.drop(y)\n\n############################################################################################################\nseq_in = tf.random.uniform(shape=(12, 256, 128))  # <-- our input data\n",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\n",
            "y = self.ffn2(F.elu(self.ffn1(x)))\nx = x + self.drop(y)\n\n############################################################################################################\nseq_in = tf.random.uniform(shape=(12, 256, 128))  # <-- our input data\n"
        ],
        [
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = nn.Conv2d(dim, dim, (3, 3), padding=1)\nself.pool1 = nn.MaxPool2d((3, 2))\n\ndef train(model, iterators, criterion, optimizers=None):\n  \n  train_iter, test_iter = iterators #",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = nn.Conv2d(dim, dim, (3, 3), padding=1)\nself.pool1 = nn.MaxPool2d((3, 2))\n\ndef train(model, iterators, criterion, optimizers=None):\n  \n  train_iter, test_iter = iterators #"
        ],
        [
            "\n        self.layer_1 = conv_block.BasicConvBlock(inp=inp, oup=planes, kernel_size=3, padding=2, stride=1)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate Keras to PyTorch\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\n",
            "\n        self.layer_1 = conv_block.BasicConvBlock(inp=inp, oup=planes, kernel_size=3, padding=2, stride=1)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.",
            "MaxPool2d(kernel_size=3, stride=2)"
        ],
        [
            "\n\tdef forward(self, x):\n\n\t\tif self.require_grads:",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\n",
            "\n\tdef forward(self, x):\n\n\t\tif self.require_grads:"
        ]
    ],
    [
        [
            "nn.ReLU()",
            "nn.ReLU()",
            "layers.ReLU()",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.",
            "ReLU()"
        ],
        [
            "nn.Dropout(0.1)",
            "nn.Dropout(0.1)",
            "layers.Dropout(0.1)",
            "# Translate Keras to PyTorch\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.",
            "Dropout(0.1)"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "x = F.relu(self.fc(x))",
            "x = tf.nn.relu(self.fc(x))",
            "# Translate Keras to PyTorch\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "nn.Embedding(vocab_size, embed_dim)\n\n",
            "nn.Embedding(vocab_size, embed_dim)",
            "layers.Embedding(vocab_size, embed_dim)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.",
            "Embedding(vocab_size, embed_dim)\n\n"
        ],
        [
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\nclass DropModels:\n    def reset_embeddings(self, embeddings):\n        if self.untie_weights:\n            self.embeddings = layers.",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "# Translate Keras to PyTorch\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\n",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\nclass DropModels:\n    def reset_embeddings(self, embeddings):\n        if self.untie_weights:\n            self.embeddings = layers."
        ],
        [
            "nn.MaxPool2d(2, stride=2)\n\n",
            "nn.MaxPool2d(2, 2)",
            "layers.MaxPooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.",
            "MaxPool2d(2, stride=2)\n\n"
        ],
        [
            "self.bn1 = nn.BatchNorm2d(ngf*2)\nself.act1 = torch.nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(ngf, ngf*2, 3, 1)\nself.pool1 = nn.MaxPool2d(n_s, stride=s_s)\n\nself.dim //= 2\nself.d_z //= 2\n\nself.z_update = ZUpdate(\n    lambda z, x: z + self.",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "self.bn1 = nn.BatchNorm2d(ngf*2)\nself.act1 = torch.nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(ngf, ngf*2, 3, 1)\nself.pool1 = nn.MaxPool2d(n_s, stride=s_s)\n\nself.dim //= 2\nself.d_z //= 2\n\nself.z_update = ZUpdate(\n    lambda z, x: z + self."
        ],
        [
            "self.bn1 = transforms.FirstBatchNorm(model_dim)\nself.act1 = transforms.FirstReLU()\nself.conv1 = transforms.FirstConv2D(num_channels)\nself.pool1 = transforms.FirstAvgPool2d(2, 2)\n\nfor layer in self[1:]:\n\n    #################\n    # BatchNorm\n    #################\n\n    if isinstance(layer, tf.keras.layers.BatchNormalization):\n        layer._enter_mode(training)\n\n",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\n",
            "self.bn1 = transforms.FirstBatchNorm(model_dim)\nself.act1 = transforms.FirstReLU()\nself.conv1 = transforms.FirstConv2D(num_channels)\nself.pool1 = transforms.FirstAvgPool2d(2, 2)\n\nfor layer in self[1:]:\n\n    #################\n    # BatchNorm\n    #################\n\n    if isinstance(layer, tf.keras.layers.BatchNormalization):\n        layer._enter_mode(training)\n\n"
        ],
        [
            "nn.LeakyReLU(args.leaky)",
            "nn.LeakyReLU(args.leaky)",
            "layers.LeakyReLU(args.leaky)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.",
            "LeakyReLU(args.leaky)"
        ],
        [
            "torch.cat(states, dim=-1)",
            "torch.cat(states, dim=-1)",
            "tf.concat(states, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.",
            "cat(states, dim=-1)"
        ],
        [
            "F.log_softmax(logits, dim=-1)",
            "F.log_softmax(logits, dim=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.",
            "log_softmax(logits, dim=-1)"
        ],
        [
            "F.softmax(input, dim=, dtype=None)\n\n",
            "F.softmax(logits, dim=-1)",
            "tf.nn.softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.",
            "softmax(input, dim=, dtype=None)\n\n"
        ],
        [
            "torch.reshape(x, [batch_size, -1])\n\n",
            "torch.reshape(x, [batch_size, -1])",
            "tf.reshape(x, [batch_size, -1])",
            "# Translate Keras to PyTorch\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.",
            "reshape(x, [batch_size, -1])\n\n"
        ],
        [
            "nn.MultiheadAttention(model_dim, num_heads, attn_dropout) or MyMultiheadAttention(model_dim, num_heads, attn_dropout)",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.",
            "MultiheadAttention(model_dim, num_heads, attn_dropout) or MyMultiheadAttention(model_dim, num_heads, attn_dropout)"
        ],
        [
            "self.attn = MultiHeadAttention(args.n_heads, args.d_model, args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.GroupNorm(args.d_model, args.d_model)\n\n###########################################################################\n\nclass DecoderBlock(layers.Layer):\n###########################################################################\n\tdef __init__(self, args, d_model, d_ff, n_heads, max_len, dropout):\n\t\tsuper(DecoderBlock, self).__init",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\n",
            "self.attn = MultiHeadAttention(args.n_heads, args.d_model, args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.GroupNorm(args.d_model, args.d_model)\n\n###########################################################################\n\nclass DecoderBlock(layers.Layer):\n###########################################################################\n\tdef __init__(self, args, d_model, d_ff, n_heads, max_len, dropout):\n\t\tsuper(DecoderBlock, self).__init"
        ],
        [
            "\n",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "# Translate Keras to PyTorch\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\n",
            "\n"
        ],
        [
            "return F.log_softmax(x, dim=-1)\n\n'''",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\n",
            "return F.log_softmax(x, dim=-1)\n\n'''"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "\n",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\n",
            "\n"
        ],
        [
            "y = self.ffn2(torch.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\nself.attn = layers.MultiHeadAttention(key_dim=model_dim)\nself.dim_red = layers.Dense(",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\n",
            "y = self.ffn2(torch.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\nself.attn = layers.MultiHeadAttention(key_dim=model_dim)\nself.dim_red = layers.Dense("
        ],
        [
            "self.bn1 = nn.BatchNorm1d(dim)\nself.conv1 = nn.Conv2d(dim, dim, 3, padding=1, bias=False)\nself.pool1 = nn.MaxPool2d(3, stride=2)\n\nself.bn1 = nn.BatchNorm1d(dim)\nself.act1 = act()\n\nself.conv1 = nn.Con",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "self.bn1 = nn.BatchNorm1d(dim)\nself.conv1 = nn.Conv2d(dim, dim, 3, padding=1, bias=False)\nself.pool1 = nn.MaxPool2d(3, stride=2)\n\nself.bn1 = nn.BatchNorm1d(dim)\nself.act1 = act()\n\nself.conv1 = nn.Con"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "nn.MaxPool2d(3, stride=2)",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.",
            "MaxPool2d(3, stride=2)"
        ],
        [
            "\n # embeddings to vec tf/idf  <===== maybe here !\n\n ",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\n",
            "\n # embeddings to vec tf/idf  <===== maybe here !\n\n "
        ]
    ],
    [
        [
            "nn.ReLU()",
            "nn.ReLU()",
            "layers.ReLU()",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.",
            "ReLU()"
        ],
        [
            "nn.Dropout2d(0.1)",
            "nn.Dropout(0.1)",
            "layers.Dropout(0.1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.",
            "Dropout2d(0.1)"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "x = F.relu(self.fc(x))",
            "x = tf.nn.relu(self.fc(x))",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "nn.Embedding(n_vocab, embed_dim) # n_vocab => vocab_size (see the input example above)",
            "nn.Embedding(vocab_size, embed_dim)",
            "layers.Embedding(vocab_size, embed_dim)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.",
            "Embedding(n_vocab, embed_dim) # n_vocab => vocab_size (see the input example above)"
        ],
        [
            "self.embed_tokens = nn.Embedding(n_words, dim_emb, padding_idx=act_constants.PAD_ID)\nself.embed_positions\nself.word_dropout\nself.embed_scale\n\nself.emb_layer_norm\n\nself.",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\n",
            "self.embed_tokens = nn.Embedding(n_words, dim_emb, padding_idx=act_constants.PAD_ID)\nself.embed_positions\nself.word_dropout\nself.embed_scale\n\nself.emb_layer_norm\n\nself."
        ],
        [
            "nn.MaxPool2d(2, 2)",
            "nn.MaxPool2d(2, 2)",
            "layers.MaxPooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.",
            "MaxPool2d(2, 2)"
        ],
        [
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\nfor d in ['/gpu:0', '/gpu:1', '/gpu:2']:\n    with tf.device(d):\n        # construct the graph\n        a = tf.constant([1.0, 2.0, 3",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\nfor d in ['/gpu:0', '/gpu:1', '/gpu:2']:\n    with tf.device(d):\n        # construct the graph\n        a = tf.constant([1.0, 2.0, 3"
        ],
        [
            "self.conv1 = nn.Conv2d(3, num_channels, kernel_size=3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\ndef __init__(self, noise_sigma):\n    super(HGD_class, self).__init__()\n    self.bn = nn.BatchNorm1d(nf, affine=False)\n    self.lrelu = nn.LeakyReLU()\n    self.add_linear\n   ",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\n",
            "self.conv1 = nn.Conv2d(3, num_channels, kernel_size=3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\ndef __init__(self, noise_sigma):\n    super(HGD_class, self).__init__()\n    self.bn = nn.BatchNorm1d(nf, affine=False)\n    self.lrelu = nn.LeakyReLU()\n    self.add_linear\n   "
        ],
        [
            "nn.LeakyReLU(leaky)",
            "nn.LeakyReLU(args.leaky)",
            "layers.LeakyReLU(args.leaky)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.",
            "LeakyReLU(leaky)"
        ],
        [
            "torch.cat(states, dim=-1)",
            "torch.cat(states, dim=-1)",
            "tf.concat(states, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.",
            "cat(states, dim=-1)"
        ],
        [
            "F.log_softmax(logits, dim=-1)",
            "F.log_softmax(logits, dim=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.",
            "log_softmax(logits, dim=-1)"
        ],
        [
            "F.softmax(logits, dim=-1)",
            "F.softmax(logits, dim=-1)",
            "tf.nn.softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.",
            "softmax(logits, dim=-1)"
        ],
        [
            "torch.reshape(x, [batch_size, -1])",
            "torch.reshape(x, [batch_size, -1])",
            "tf.reshape(x, [batch_size, -1])",
            "# Translate Keras to PyTorch\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.",
            "reshape(x, [batch_size, -1])"
        ],
        [
            "nn.MultiheadAttention(embed_dim=num_heads, attn_dropout=attn_dropout)",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.",
            "MultiheadAttention(embed_dim=num_heads, attn_dropout=attn_dropout)"
        ],
        [
            "self.attn = MultiHeadAttention(args.n_heads, args.d_model, args.dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\n",
            "self.attn = MultiHeadAttention(args.n_heads, args.d_model, args.dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)"
        ],
        [
            "\n",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\n",
            "\n"
        ],
        [
            "return F.log_softmax(x, dim=-1)\n\n######################################################################\n\n### Refs\n\n- https://machinelearningmastery.com/how-to-enable-cuda-for-the-ker",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\n",
            "return F.log_softmax(x, dim=-1)\n\n######################################################################\n\n### Refs\n\n- https://machinelearningmastery.com/how-to-enable-cuda-for-the-ker"
        ],
        [
            "\n",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\n",
            "\n"
        ],
        [
            "\n        if n % args.valid_every == 0:   # do evaluation and",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nx = self.layer1(x)\n# PyTorch\n",
            "\n        if n % args.valid_every == 0:   # do evaluation and"
        ],
        [
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\nprint(\"Test successful!\")",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\n",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\nprint(\"Test successful!\")"
        ],
        [
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, stride=2)\n\nself.conv2 = ConvBNReLU(in_c, c, groups=in_c)\nself.pool2 = nn.Sequential(OrderedDict([(\"pool\", n",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, stride=2)\n\nself.conv2 = ConvBNReLU(in_c, c, groups=in_c)\nself.pool2 = nn.Sequential(OrderedDict([(\"pool\", n"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "nn.MaxPool2d(3, stride=2)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.",
            "MaxPool2d(3, stride=2)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ]
    ],
    [
        [
            "nn.ReLU()",
            "nn.ReLU()",
            "layers.ReLU()",
            "# Translate Keras to PyTorch\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.",
            "ReLU()"
        ],
        [
            "nn.Dropout(0.1)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "nn.Dropout(0.1)",
            "layers.Dropout(0.1)",
            "# Translate Keras to PyTorch\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.",
            "Dropout(0.1)\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "x = F.relu(self.fc(x))",
            "x = tf.nn.relu(self.fc(x))",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "nn.Embedding(vocab_size, embed_dim)",
            "nn.Embedding(vocab_size, embed_dim)",
            "layers.Embedding(vocab_size, embed_dim)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.",
            "Embedding(vocab_size, embed_dim)"
        ],
        [
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb, max_len)\n\n#######################\n\ndef test_switch(v1, v2, cond):\n    # switch\uff0cKeras shape=[batch_size, dim_",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)",
            "max_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\n",
            "max_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb, max_len)\n\n#######################\n\ndef test_switch(v1, v2, cond):\n    # switch\uff0cKeras shape=[batch_size, dim_"
        ],
        [
            "nn.MaxPool2d(2, 2)",
            "nn.MaxPool2d(2, 2)",
            "layers.MaxPooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.",
            "MaxPool2d(2, 2)"
        ],
        [
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = F.leaky_relu(self.bn1, negative_slope=0.2)\nself.conv1 = nn.Conv2d(dim, dim, kernel_size=3)\nself.pool1 = nn.MaxPool2d((3, 2))\n\ndef get_self_attn_weights(self, x):\n    pos_emb = self.r_emb[0]\n    h = self.drop1(self.",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = F.leaky_relu(self.bn1, negative_slope=0.2)\nself.conv1 = nn.Conv2d(dim, dim, kernel_size=3)\nself.pool1 = nn.MaxPool2d((3, 2))\n\ndef get_self_attn_weights(self, x):\n    pos_emb = self.r_emb[0]\n    h = self.drop1(self."
        ],
        [
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, kernel_size=3)\nself.pool1 = nn.AvgPool2d(kernel_size=2)\n\nself.bn2 = nn.BatchNorm2d(num_channels)\nself.act2 = nn.ReLU()\nself.conv2 = n",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, 3)\nself.pool1 = nn.AvgPool2d(2, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.ReLU()\nself.conv1 = layers.Conv2D(num_channels, 3)\nself.pool1 = layers.AveragePooling2D(2, 2)\n# PyTorch\n",
            "self.bn1 = nn.BatchNorm2d(num_channels)\nself.act1 = nn.ReLU()\nself.conv1 = nn.Conv2d(num_channels, num_channels, kernel_size=3)\nself.pool1 = nn.AvgPool2d(kernel_size=2)\n\nself.bn2 = nn.BatchNorm2d(num_channels)\nself.act2 = nn.ReLU()\nself.conv2 = n"
        ],
        [
            "nn.LeakyReLU(args.leaky)",
            "nn.LeakyReLU(args.leaky)",
            "layers.LeakyReLU(args.leaky)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.",
            "LeakyReLU(args.leaky)"
        ],
        [
            "torch.cat(states, dim=-1)",
            "torch.cat(states, dim=-1)",
            "tf.concat(states, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.",
            "cat(states, dim=-1)"
        ],
        [
            "F.log_softmax(logits, dim=-1)",
            "F.log_softmax(logits, dim=-1)",
            "tf.nn.log_softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.",
            "log_softmax(logits, dim=-1)"
        ],
        [
            "F.softmax(logits, dim=-1)",
            "F.softmax(logits, dim=-1)",
            "tf.nn.softmax(logits, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.",
            "softmax(logits, dim=-1)"
        ],
        [
            "torch.reshape(x, [batch_size, -1])",
            "torch.reshape(x, [batch_size, -1])",
            "tf.reshape(x, [batch_size, -1])",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.",
            "reshape(x, [batch_size, -1])"
        ],
        [
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, attn_dropout=attn_dropout)",
            "nn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "layers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.",
            "MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, attn_dropout=attn_dropout)"
        ],
        [
            "self.attn = MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "self.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)",
            "self.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\nx = self.layer1(x)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.LeakyReLU(args.leaky)\n# PyTorch\nnn.LeakyReLU(args.leaky)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = layers.LeakyReLU(0.2)\nself.conv1 = layers.Conv2D(dim, 3)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = nn.LeakyReLU(0.2)\nself.conv1 = nn.Conv2d(dim, dim, 3)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\n",
            "self.attn = MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)"
        ],
        [
            "\n",
            "self.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))",
            "self.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\n",
            "\n"
        ],
        [
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\nself.bn1 = nn.modules.batchnorm(_input)\n\n\nself._in_shape = shape  ",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)",
            "x = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\n",
            "x = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\nself.bn1 = nn.modules.batchnorm(_input)\n\n\nself._in_shape = shape  "
        ],
        [
            "\n",
            "z = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)",
            "z = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\nself.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\n",
            "\n"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "x = self.layer1(x)",
            "x = self.layer1(x)",
            "# Translate Keras to PyTorch\n\n# Keras\nx = self.classifier(x)\nreturn tf.nn.log_softmax(x, axis=-1)\n# PyTorch\nx = self.classifier(x)\nreturn F.log_softmax(x, dim=-1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nx = self.layer1(x)\n# PyTorch\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "out = torch.nn.ReLU()(self.feed_forward(norm(x)))\nx = x + self.drop(out)\n\n\n\nif __name__ == '__main__':\n\n    TRG_VOCAB_SIZE = 6000\n    TRG_EMBED_SIZE =",
            "y = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "y = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)",
            "# Translate Keras to PyTorch\n\n# Keras\nlayers.Embedding(vocab_size, embed_dim)\n# PyTorch\nnn.Embedding(vocab_size, embed_dim)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.MaxPool2d(kernel_size=3, stride=2)\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\n",
            "out = torch.nn.ReLU()(self.feed_forward(norm(x)))\nx = x + self.drop(out)\n\n\n\nif __name__ == '__main__':\n\n    TRG_VOCAB_SIZE = 6000\n    TRG_EMBED_SIZE ="
        ],
        [
            "self.bn1 = torch.nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = nn.Conv2d(dim, dim, 3, padding=1, bias=True)\nself.pool1 = nn.MaxPool2d(3, stride=2)\n\nkwargs = {'bn_roll': True, 'bn_prelu': True}\n\nmodels.compile()",
            "self.bn1 = nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = nn.MaxPool2d(3, 2)",
            "self.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.softmax(logits, axis=-1)\n# PyTorch\nF.softmax(logits, dim=-1)\n\n# Keras\nself.rnn = (layers.LSTM(d_model) if rnn_type == 'LSTM' else layers.GRU(d_model))\n# PyTorch\nself.rnn = (nn.LSTM(d_model, d_model) if rnn_type == 'LSTM' else nn.GRU(d_model, d_model))\n\n# Keras\nz = tf.concat([tf.reshape(x, [bsz, -1]), tf.reshape(y, [bsz, -1])], axis=1)\n# PyTorch\nz = torch.cat([torch.reshape(x, [bsz, -1]), torch.reshape(y, [bsz, -1])], dim=1)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nself.bn1 = layers.BatchNormalization()\nself.act1 = activation()\nself.conv1 = conv3x3(dim)\nself.pool1 = layers.MaxPooling2D(3, 2)\n# PyTorch\n",
            "self.bn1 = torch.nn.BatchNorm2d(dim)\nself.act1 = activation()\nself.conv1 = nn.Conv2d(dim, dim, 3, padding=1, bias=True)\nself.pool1 = nn.MaxPool2d(3, stride=2)\n\nkwargs = {'bn_roll': True, 'bn_prelu': True}\n\nmodels.compile()"
        ],
        [
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "self.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nx = tf.nn.relu(self.fc(x))\n# PyTorch\nx = F.relu(self.fc(x))\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\nself.fc = CustomLinear(dim)\n\n# Keras\nlayers.MaxPooling2D(2, 2)\n# PyTorch\nnn.MaxPool2d(2, 2)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\n",
            "\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n"
        ],
        [
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "nn.MaxPool2d(kernel_size=3, stride=2)",
            "layers.MaxPooling2D(pool_size=3, strides=2)",
            "# Translate Keras to PyTorch\n\n# Keras\nself.attn = layers.MultiHeadAttention(args.n_heads, args.d_model, dropout=args.att_dropout)\nself.drop1 = layers.Dropout(args.dropout)\nself.norm1 = layers.LayerNormalization(args.d_model)\n# PyTorch\nself.attn = nn.MultiheadAttention(args.d_model, args.n_heads, dropout=args.att_dropout)\nself.drop1 = nn.Dropout(args.dropout)\nself.norm1 = nn.LayerNorm(args.d_model)\n\n# Keras\nlayers.MultiHeadAttention(key_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n# PyTorch\nnn.MultiheadAttention(embed_dim=model_dim, num_heads=num_heads, dropout=attn_dropout)\n\n# Keras\ny = self.ffn2(tf.nn.relu(self.ffn1(x)))\nx = x + self.drop(y)\n# PyTorch\ny = self.ffn2(F.relu(self.ffn1(x)))\nx = x + self.drop(y)\n\n# Keras\ntf.reshape(x, [batch_size, -1])\n# PyTorch\ntorch.reshape(x, [batch_size, -1])\n\n# Keras\nmax_len = 512\nself.embed_tokens = layers.Embedding(n_words, dim_emb, input_length=max_len)\n# PyTorch\nmax_len = 512\nself.embed_tokens = nn.Embedding(n_words, dim_emb)\n\n# Keras\nlayers.MaxPooling2D(pool_size=3, strides=2)\n# PyTorch\nnn.",
            "MaxPool2d(kernel_size=3, stride=2)"
        ],
        [
            "\n",
            "self.fc = CustomLinear(dim)",
            "self.fc = CustomLinear(dim)",
            "# Translate Keras to PyTorch\n\n# Keras\ntf.nn.log_softmax(logits, axis=-1)\n# PyTorch\nF.log_softmax(logits, dim=-1)\n\n# Keras\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n# PyTorch\nself.layer_1 = BasicConv2D(planes, kernel=3, stride=1, dilation=2)\n\n# Keras\nlayers.ReLU()\n# PyTorch\nnn.ReLU()\n\n# Keras\nlayers.Dropout(0.1)\n# PyTorch\nnn.Dropout(0.1)\n\n# Keras\ntf.concat(states, axis=-1)\n# PyTorch\ntorch.cat(states, dim=-1)\n\n# Keras\nself.fc = CustomLinear(dim)\n# PyTorch\n",
            "\n"
        ]
    ]
]