{
  "cells": [
    {
      "cell_type": "code",
      "execution_count": 1,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "jchu4w0rZ7wn",
        "outputId": "47e39352-8579-448c-f867-81036990c0db"
      },
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "Collecting google-play-scraper\n",
            "  Downloading google_play_scraper-1.2.7-py3-none-any.whl.metadata (50 kB)\n",
            "\u001b[?25l     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m0.0/50.2 kB\u001b[0m \u001b[31m?\u001b[0m eta \u001b[36m-:--:--\u001b[0m\r\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m50.2/50.2 kB\u001b[0m \u001b[31m2.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
            "\u001b[?25hDownloading google_play_scraper-1.2.7-py3-none-any.whl (28 kB)\n",
            "Installing collected packages: google-play-scraper\n",
            "Successfully installed google-play-scraper-1.2.7\n",
            "Collecting app-store-scraper\n",
            "  Downloading app_store_scraper-0.3.5-py3-none-any.whl.metadata (5.1 kB)\n",
            "Collecting requests==2.23.0 (from app-store-scraper)\n",
            "  Downloading requests-2.23.0-py2.py3-none-any.whl.metadata (6.8 kB)\n",
            "Collecting chardet<4,>=3.0.2 (from requests==2.23.0->app-store-scraper)\n",
            "  Downloading chardet-3.0.4-py2.py3-none-any.whl.metadata (3.2 kB)\n",
            "Collecting idna<3,>=2.5 (from requests==2.23.0->app-store-scraper)\n",
            "  Downloading idna-2.10-py2.py3-none-any.whl.metadata (9.1 kB)\n",
            "Collecting urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 (from requests==2.23.0->app-store-scraper)\n",
            "  Downloading urllib3-1.25.11-py2.py3-none-any.whl.metadata (41 kB)\n",
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m41.1/41.1 kB\u001b[0m \u001b[31m2.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
            "\u001b[?25hRequirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.12/dist-packages (from requests==2.23.0->app-store-scraper) (2025.8.3)\n",
            "Downloading app_store_scraper-0.3.5-py3-none-any.whl (8.3 kB)\n",
            "Downloading requests-2.23.0-py2.py3-none-any.whl (58 kB)\n",
            "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m58.4/58.4 kB\u001b[0m \u001b[31m2.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
            "\u001b[?25hDownloading chardet-3.0.4-py2.py3-none-any.whl (133 kB)\n",
            "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m133.4/133.4 kB\u001b[0m \u001b[31m6.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
            "\u001b[?25hDownloading idna-2.10-py2.py3-none-any.whl (58 kB)\n",
            "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m58.8/58.8 kB\u001b[0m \u001b[31m3.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
            "\u001b[?25hDownloading urllib3-1.25.11-py2.py3-none-any.whl (127 kB)\n",
            "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m128.0/128.0 kB\u001b[0m \u001b[31m9.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
            "\u001b[?25hInstalling collected packages: chardet, urllib3, idna, requests, app-store-scraper\n",
            "  Attempting uninstall: chardet\n",
            "    Found existing installation: chardet 5.2.0\n",
            "    Uninstalling chardet-5.2.0:\n",
            "      Successfully uninstalled chardet-5.2.0\n",
            "  Attempting uninstall: urllib3\n",
            "    Found existing installation: urllib3 2.5.0\n",
            "    Uninstalling urllib3-2.5.0:\n",
            "      Successfully uninstalled urllib3-2.5.0\n",
            "  Attempting uninstall: idna\n",
            "    Found existing installation: idna 3.10\n",
            "    Uninstalling idna-3.10:\n",
            "      Successfully uninstalled idna-3.10\n",
            "  Attempting uninstall: requests\n",
            "    Found existing installation: requests 2.32.4\n",
            "    Uninstalling requests-2.32.4:\n",
            "      Successfully uninstalled requests-2.32.4\n",
            "\u001b[31mERROR: pip's dependency resolver does not currently take into account all the packages that are installed. This behaviour is the source of the following dependency conflicts.\n",
            "google-colab 1.0.0 requires requests==2.32.4, but you have requests 2.23.0 which is incompatible.\n",
            "google-adk 1.14.1 requires requests<3.0.0,>=2.32.4, but you have requests 2.23.0 which is incompatible.\n",
            "google-genai 1.38.0 requires requests<3.0.0,>=2.28.1, but you have requests 2.23.0 which is incompatible.\n",
            "libpysal 4.13.0 requires requests>=2.27, but you have requests 2.23.0 which is incompatible.\n",
            "tiktoken 0.11.0 requires requests>=2.26.0, but you have requests 2.23.0 which is incompatible.\n",
            "yfinance 0.2.66 requires requests>=2.31, but you have requests 2.23.0 which is incompatible.\n",
            "sphinx 8.2.3 requires requests>=2.30.0, but you have requests 2.23.0 which is incompatible.\n",
            "datasets 4.0.0 requires requests>=2.32.2, but you have requests 2.23.0 which is incompatible.\n",
            "distributed 2025.5.0 requires urllib3>=1.26.5, but you have urllib3 1.25.11 which is incompatible.\n",
            "sentry-sdk 2.38.0 requires urllib3>=1.26.11, but you have urllib3 1.25.11 which is incompatible.\n",
            "tweepy 4.16.0 requires requests<3,>=2.27.0, but you have requests 2.23.0 which is incompatible.\n",
            "bigframes 2.21.0 requires requests>=2.27.1, but you have requests 2.23.0 which is incompatible.\n",
            "opentelemetry-resourcedetector-gcp 1.9.0a0 requires requests~=2.24, but you have requests 2.23.0 which is incompatible.\u001b[0m\u001b[31m\n",
            "\u001b[0mSuccessfully installed app-store-scraper-0.3.5 chardet-3.0.4 idna-2.10 requests-2.23.0 urllib3-1.25.11\n"
          ]
        }
      ],
      "source": [
        "!pip install google-play-scraper\n",
        "!pip install app-store-scraper"
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "from google_play_scraper import reviews_all, Sort\n",
        "import pandas as pd\n",
        "\n",
        "# List of App IDs\n",
        "app_ids = [\n",
        "    #Learning, Game & Editing Apps\n",
        "    \"com.studysmarter\",\n",
        "    \"com.wonder\",\n",
        "    \"com.alison.mobile.flutter\",\n",
        "    \"com.letterschool.lite\",\n",
        "    \"com.atistudios.mondly.languages\",\n",
        "    \"com.cyberlink.youperfect\",\n",
        "    \"photocollage.photoeditor.collagemaker\",\n",
        "    \"com.magicv.airbrush\",\n",
        "    \"com.cyberlink.photodirector\",\n",
        "    \"com.vsco.cam\",\n",
        "    \"com.namcobandaigames.pacmantournaments\",\n",
        "    \"com.matteljv.uno\",\n",
        "    \"com.os.airforce\",\n",
        "    \"com.generagames.resistance\",\n",
        "    \"com.gameloft.android.ANMP.GloftM5HM\",\n",
        "    \"com.duolingo\",\n",
        "    \"com.a10minuteschool.tenminuteschool\",\n",
        "    \"tech.shikho.android\",\n",
        "    \"com.getmimo\",\n",
        "    \"com.sololearn\",\n",
        "    \"com.byjus.thelearningapp\",\n",
        "    \"org.khankids.android\",\n",
        "    \"com.kids.learn.reading.app\",\n",
        "    \"com.udemy.android\",\n",
        "    \"org.coursera.android\",\n",
        "    \"com.niksoftware.snapseed\",\n",
        "    \"com.picsart.studio\",\n",
        "    \"com.lemon.lvoverseas\",\n",
        "    \"com.adobe.lrmobile\",\n",
        "    \"com.camerasideas.instashot\",\n",
        "    \"com.bigwinepot.nwdn.international\",\n",
        "    \"com.adsk.sketchbook\",\n",
        "    \"photo.editor.photoeditor.photoeditorpro\",\n",
        "    \"com.canva.editor\",\n",
        "    \"com.nexstreaming.app.kinemasterfree\",\n",
        "    \"com.kiloo.subwaysurf\",\n",
        "    \"com.imangi.templerun\",\n",
        "    \"com.outfit7.mytalkingangelafree\",\n",
        "    \"com.miniclip.carrom\",\n",
        "    \"com.king.candycrushsaga\",\n",
        "    \"com.halfbrick.fruitninjafree\",\n",
        "    \"com.ludo.king\",\n",
        "    \"com.fgol.HungrySharkEvolution\",\n",
        "    \"com.supercell.clashofclans\",\n",
        "    \"com.fingersoft.hcr2\"\n",
        "]\n",
        "\n",
        "# Initialize empty DataFrame\n",
        "all_reviews = pd.DataFrame()\n",
        "\n",
        "# Loop through each app and collect reviews\n",
        "for app_id in app_ids:\n",
        "    print(f\"Fetching reviews for {app_id} ...\")\n",
        "    try:\n",
        "        g_reviews = reviews_all(\n",
        "            app_id,\n",
        "            sleep_milliseconds=0,\n",
        "            lang='en',\n",
        "            country='us',\n",
        "            sort=Sort.NEWEST,\n",
        "        )\n",
        "\n",
        "        # Convert reviews to DataFrame\n",
        "        g_df = pd.DataFrame(g_reviews)\n",
        "\n",
        "        # Drop unnecessary columns\n",
        "        g_df.drop(columns={'userImage', 'reviewCreatedVersion', 'replyContent', 'repliedAt'}, inplace=True, errors='ignore')\n",
        "\n",
        "        # Rename columns\n",
        "        g_df.rename(columns={\n",
        "            'score': 'rating',\n",
        "            'userName': 'user_name',\n",
        "            'reviewId': 'review_id',\n",
        "            'content': 'review_description',\n",
        "            'at': 'review_date',\n",
        "            'thumbsUpCount': 'thumbs_up'\n",
        "        }, inplace=True)\n",
        "\n",
        "        # Add extra columns\n",
        "        g_df['source'] = 'Google Play'\n",
        "        g_df['review_title'] = ''\n",
        "        g_df['language_code'] = 'en'\n",
        "        g_df['country_code'] = 'us'\n",
        "        g_df['app_id'] = app_id  # <-- Add app identifier\n",
        "\n",
        "        # Append to main DataFrame\n",
        "        all_reviews = pd.concat([all_reviews, g_df], ignore_index=True)\n",
        "\n",
        "    except Exception as e:\n",
        "        print(f\"Error fetching {app_id}: {e}\")\n",
        "\n",
        "# Save to CSV\n",
        "csv_filename = \"Google Play Store Review Dataset Raw.csv\"\n",
        "all_reviews.to_csv(csv_filename, index=False, encoding=\"utf-8\")\n",
        "print(f\"✅ All reviews saved to {csv_filename}\")\n"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "zL5DpfmuHta9",
        "outputId": "23c508a5-36a0-42c9-828b-e9ff0bc66acf"
      },
      "execution_count": 6,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "✅ All reviews saved to Google Play Store Review Dataset Raw.csv\n"
          ]
        }
      ]
    }
  ],
  "metadata": {
    "colab": {
      "provenance": []
    },
    "kernelspec": {
      "display_name": "Python 3",
      "name": "python3"
    },
    "language_info": {
      "name": "python"
    }
  },
  "nbformat": 4,
  "nbformat_minor": 0
}