Spaces:

alecrem
/

middleschool

Running

App Files Files Community

Alejandro Cremades committed on Sep 23, 2023

Commit

6ca52a1

•

1 Parent(s): 5fd242f

Black format notebook

Browse files

Files changed (1) hide show

middleschool-cardlist.ipynb +83 -72

middleschool-cardlist.ipynb CHANGED Viewed

@@ -112,31 +112,28 @@
     "    cards = json.loads(json_data.read())\n",
     "\n",
     "# Create a pandas DataFrame with all cards from all legal sets\n",
-    "column_names = ['oracle_id', 'name', 'name_ja']\n",
     "middleschool_df = pd.DataFrame(columns=column_names)\n",
     "for card in cards:\n",
-    "    oracle_id = card['identifiers']['scryfallOracleId']\n",
-    "    name = card['name']\n",
-    "    lang_ja = [lang for lang in card['foreignData']\n",
-    "               if lang['language'] == 'Japanese']\n",
     "    # Some cards do not have a Japanese name\n",
-    "    if (len(lang_ja) > 0):\n",
-    "        name_ja = lang_ja[0]['name']\n",
     "    else:\n",
     "        name_ja = None\n",
-    "    temporary_df = pd.DataFrame({\n",
-    "        'oracle_id': [oracle_id],\n",
-    "        'name':      [name],\n",
-    "        'name_ja':   [name_ja]\n",
-    "    })\n",
     "    middleschool_df = pd.concat([middleschool_df, temporary_df])\n",
     "\n",
     "# For cards with multiple occurrences, put the rows that have the Japanese name on top\n",
-    "middleschool_df = middleschool_df.sort_values(by=['name', 'name_ja'])\n",
     "# For cards with multiple occurrences, delete all rows except for the top one\n",
-    "middleschool_df = middleschool_df.drop_duplicates(subset=['oracle_id'])\n",
-    "print(middleschool_df.shape[0], 'cards found')\n",
-    "print('These are the first and last 5 cards')\n",
     "print(middleschool_df.head())\n",
     "print(middleschool_df.tail())\n"
    ]
@@ -146,7 +143,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "Remove Japanese card names that are wrong on MTGJSON"
    ]
   },
   {
@@ -186,13 +183,23 @@
     }
    ],
    "source": [
-    "wrongnames = ['Aether Barrier', 'Aether Burst', 'Aether Charge', 'Aether Flash', 'Aether Mutation',\n",
-    "              'Aether Sting', 'Aether Storm', 'Aether Tide', 'Tainted Aether', 'Tar Pit Warrior']\n",
-    "print('Before:')\n",
-    "print(middleschool_df.loc[middleschool_df['name'].isin(wrongnames)])\n",
-    "middleschool_df.loc[middleschool_df['name'].isin(wrongnames), 'name_ja'] = None\n",
-    "print('After:')\n",
-    "print(middleschool_df.loc[middleschool_df['name'].isin(wrongnames)])\n"
    ]
   },
   {
@@ -200,7 +207,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "Find Japanese names for cards that were not released in Japanese in Middle School legal sets"
    ]
   },
   {
@@ -225,14 +232,15 @@
    "source": [
     "import time\n",
     "from requests_html import HTMLSession\n",
     "session = HTMLSession()\n",
     "\n",
     "\n",
     "def find_japanese_name(name):\n",
-    "    url = 'http://whisper.wisdom-guild.net/card/' + name + '/'\n",
     "    r = session.get(url)\n",
     "    # Find the text on the <title> element in the HTML document\n",
-    "    title = r.html.find('title')[0].text\n",
     "    # Find the position of the English card name within the title\n",
     "    idx = title.find(name)\n",
     "    # The Japanese name should be before the English name,\n",
@@ -241,7 +249,7 @@
     "        return None\n",
     "    # If the exact English card name can't be found, we look for a '/'\n",
     "    if idx == -1:\n",
-    "        idx = title.find('/')\n",
     "        # No '/' means no Japanese name\n",
     "        if idx == -1:\n",
     "            return None\n",
@@ -249,17 +257,18 @@
     "        name_ja = title[0:idx]\n",
     "    else:\n",
     "        # Take only the Japanese name from the title\n",
-    "        name_ja = title[0:idx - 1]\n",
     "    return name_ja\n",
     "\n",
     "\n",
-    "english_only_cards = middleschool_df[middleschool_df['name_ja'].isnull()]\n",
-    "name_list = english_only_cards['name'].to_list()\n",
     "for idx, name in enumerate(name_list):\n",
-    "    middleschool_df.loc[middleschool_df['name'] ==\n",
-    "                        name, 'name_ja'] = find_japanese_name(name)\n",
     "    # print(middleschool_df.loc[middleschool_df['name'] == name])\n",
-    "    print('.', end='')\n",
     "    if idx % 80 == 79:\n",
     "        print()\n",
     "    time.sleep(1)\n"
@@ -270,7 +279,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "Exclude all cards banned in Middle School"
    ]
   },
   {
@@ -289,44 +298,46 @@
     }
    ],
    "source": [
-    "banlist = [\"Amulet of Quoz\",\n",
-    "           \"Balance\",\n",
-    "           \"Brainstorm\",\n",
-    "           \"Bronze Tablet\",\n",
-    "           \"Channel\",\n",
-    "           \"Dark Ritual\",\n",
-    "           \"Demonic Consultation\",\n",
-    "           \"Flash\",\n",
-    "           \"Goblin Recruiter\",\n",
-    "           \"Imperial Seal\",\n",
-    "           \"Jeweled Bird\",\n",
-    "           \"Mana Crypt\",\n",
-    "           \"Mana Vault\",\n",
-    "           \"Memory Jar\",\n",
-    "           \"Mind's Desire\",\n",
-    "           \"Mind Twist\",\n",
-    "           \"Rebirth\",\n",
-    "           \"Strip Mine\",\n",
-    "           \"Tempest Efreet\",\n",
-    "           \"Timmerian Fiends\",\n",
-    "           \"Tolarian Academy\",\n",
-    "           \"Vampiric Tutor\",\n",
-    "           \"Windfall\",\n",
-    "           \"Yawgmoth's Bargain\",\n",
-    "           \"Yawgmoth's Will\"]\n",
-    "print('Cards legal by set:', middleschool_df.shape[0])\n",
     "# Find the rows with the banned cards\n",
-    "banned_df = middleschool_df[pd.DataFrame(\n",
-    "    middleschool_df.name.tolist()).isin(banlist).any(axis=1).values]\n",
-    "print('Banned cards:', banned_df.shape[0])\n",
     "# Append the banned cards to the main Middle School DataFrame,\n",
     "# then remove any rows that appear twice,\n",
     "# effectively leaving only the legal cards\n",
-    "middleschool_df = pd.concat(\n",
-    "    [middleschool_df, banned_df]).drop_duplicates(keep=False)\n",
-    "print('Cards legal by set and not banned:', middleschool_df.shape[0])\n",
     "middleschool_df = middleschool_df.reset_index(drop=True)\n",
-    "middleschool_df = middleschool_df[['oracle_id', 'name', 'name_ja']]\n"
    ]
   },
   {
@@ -343,8 +354,8 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "middleschool_df.to_csv('output/middleschool.csv')\n",
-    "middleschool_df.to_json('output/middleschool.json')\n"
    ]
   },
   {
@@ -352,7 +363,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "Feel free to delete everything in the `data` directory after you are done"
    ]
   }
  ],
@@ -372,7 +383,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.11.3"
   },
   "orig_nbformat": 4,
   "vscode": {

     "    cards = json.loads(json_data.read())\n",
     "\n",
     "# Create a pandas DataFrame with all cards from all legal sets\n",
+    "column_names = [\"oracle_id\", \"name\", \"name_ja\"]\n",
+    "# Collect one record per card and build the DataFrame in a single step:\n",
+    "# calling pd.concat inside the loop copies every accumulated row again on\n",
+    "# each iteration, which gets slow as the card list grows\n",
+    "card_records = []\n",
     "for card in cards:\n",
+    "    oracle_id = card[\"identifiers\"][\"scryfallOracleId\"]\n",
+    "    name = card[\"name\"]\n",
+    "    # Some cards do not have a Japanese name; name_ja is None for those\n",
+    "    name_ja = next(\n",
+    "        (\n",
+    "            lang[\"name\"]\n",
+    "            for lang in card[\"foreignData\"]\n",
+    "            if lang[\"language\"] == \"Japanese\"\n",
+    "        ),\n",
+    "        None,\n",
+    "    )\n",
+    "    card_records.append({\"oracle_id\": oracle_id, \"name\": name, \"name_ja\": name_ja})\n",
+    "# Passing columns= keeps the three expected columns even if no cards were loaded\n",
+    "middleschool_df = pd.DataFrame(card_records, columns=column_names)\n",
     "\n",
     "# For cards with multiple occurrences, put the rows that have the Japanese name on top\n",
+    "middleschool_df = middleschool_df.sort_values(by=[\"name\", \"name_ja\"])\n",
     "# For cards with multiple occurrences, delete all rows except for the top one\n",
+    "middleschool_df = middleschool_df.drop_duplicates(subset=[\"oracle_id\"])\n",
+    "print(middleschool_df.shape[0], \"cards found\")\n",
+    "print(\"These are the first and last 5 cards\")\n",
     "print(middleschool_df.head())\n",
     "print(middleschool_df.tail())\n"
    ]
    "cell_type": "markdown",
    "metadata": {},
    "source": [
+    "Remove Japanese card names that are wrong on MTGJSON\n"
    ]
   },
   {
     }
    ],
    "source": [
+    "wrongnames = [\n",
+    "    \"Aether Barrier\",\n",
+    "    \"Aether Burst\",\n",
+    "    \"Aether Charge\",\n",
+    "    \"Aether Flash\",\n",
+    "    \"Aether Mutation\",\n",
+    "    \"Aether Sting\",\n",
+    "    \"Aether Storm\",\n",
+    "    \"Aether Tide\",\n",
+    "    \"Tainted Aether\",\n",
+    "    \"Tar Pit Warrior\",\n",
+    "]\n",
+    "# Only name_ja is changed below, never name, so a single mask built from the\n",
+    "# name column selects the same rows before and after the update\n",
+    "has_wrong_name = middleschool_df[\"name\"].isin(wrongnames)\n",
+    "print(\"Before:\")\n",
+    "print(middleschool_df.loc[has_wrong_name])\n",
+    "# Blank out the Japanese name on the selected rows\n",
+    "middleschool_df.loc[has_wrong_name, \"name_ja\"] = None\n",
+    "print(\"After:\")\n",
+    "print(middleschool_df.loc[has_wrong_name])\n"
    ]
   },
   {
    "cell_type": "markdown",
    "metadata": {},
    "source": [
+    "Find Japanese names for cards that were not released in Japanese in Middle School legal sets\n"
    ]
   },
   {
    "source": [
     "import time\n",
     "from requests_html import HTMLSession\n",
+    "\n",
     "session = HTMLSession()\n",
     "\n",
     "\n",
     "def find_japanese_name(name):\n",
+    "    url = \"http://whisper.wisdom-guild.net/card/\" + name + \"/\"\n",
     "    r = session.get(url)\n",
     "    # Find the text on the <title> element in the HTML document\n",
+    "    title = r.html.find(\"title\")[0].text\n",
     "    # Find the position of the English card name within the title\n",
     "    idx = title.find(name)\n",
     "    # The Japanese name should be before the English name,\n",
     "        return None\n",
     "    # If the exact English card name can't be found, we look for a '/'\n",
     "    if idx == -1:\n",
+    "        idx = title.find(\"/\")\n",
     "        # No '/' means no Japanese name\n",
     "        if idx == -1:\n",
     "            return None\n",
     "        name_ja = title[0:idx]\n",
     "    else:\n",
     "        # Take only the Japanese name from the title\n",
+    "        name_ja = title[0 : idx - 1]\n",
     "    return name_ja\n",
     "\n",
     "\n",
+    "english_only_cards = middleschool_df[middleschool_df[\"name_ja\"].isnull()]\n",
+    "name_list = english_only_cards[\"name\"].to_list()\n",
     "for idx, name in enumerate(name_list):\n",
+    "    middleschool_df.loc[\n",
+    "        middleschool_df[\"name\"] == name, \"name_ja\"\n",
+    "    ] = find_japanese_name(name)\n",
     "    # print(middleschool_df.loc[middleschool_df['name'] == name])\n",
+    "    print(\".\", end=\"\")\n",
     "    if idx % 80 == 79:\n",
     "        print()\n",
     "    time.sleep(1)\n"
    "cell_type": "markdown",
    "metadata": {},
    "source": [
+    "Exclude all cards banned in Middle School\n"
    ]
   },
   {
     }
    ],
    "source": [
+    "banlist = [\n",
+    "    \"Amulet of Quoz\",\n",
+    "    \"Balance\",\n",
+    "    \"Brainstorm\",\n",
+    "    \"Bronze Tablet\",\n",
+    "    \"Channel\",\n",
+    "    \"Dark Ritual\",\n",
+    "    \"Demonic Consultation\",\n",
+    "    \"Flash\",\n",
+    "    \"Goblin Recruiter\",\n",
+    "    \"Imperial Seal\",\n",
+    "    \"Jeweled Bird\",\n",
+    "    \"Mana Crypt\",\n",
+    "    \"Mana Vault\",\n",
+    "    \"Memory Jar\",\n",
+    "    \"Mind's Desire\",\n",
+    "    \"Mind Twist\",\n",
+    "    \"Rebirth\",\n",
+    "    \"Strip Mine\",\n",
+    "    \"Tempest Efreet\",\n",
+    "    \"Timmerian Fiends\",\n",
+    "    \"Tolarian Academy\",\n",
+    "    \"Vampiric Tutor\",\n",
+    "    \"Windfall\",\n",
+    "    \"Yawgmoth's Bargain\",\n",
+    "    \"Yawgmoth's Will\",\n",
+    "]\n",
+    "print(\"Cards legal by set:\", middleschool_df.shape[0])\n",
+    "# Flag the rows whose English name is on the banlist (exact match)\n",
+    "is_banned = middleschool_df[\"name\"].isin(banlist)\n",
+    "banned_df = middleschool_df[is_banned]\n",
+    "print(\"Banned cards:\", banned_df.shape[0])\n",
+    "# Keep only the rows that are not banned. Filtering with the mask removes\n",
+    "# exactly the banned rows and does not rely on duplicate detection, which\n",
+    "# would also drop any unrelated rows that happen to be identical\n",
+    "middleschool_df = middleschool_df[~is_banned]\n",
+    "print(\"Cards legal by set and not banned:\", middleschool_df.shape[0])\n",
     "middleschool_df = middleschool_df.reset_index(drop=True)\n",
+    "middleschool_df = middleschool_df[[\"oracle_id\", \"name\", \"name_ja\"]]\n"
    ]
   },
   {
    "metadata": {},
    "outputs": [],
    "source": [
+    "middleschool_df.to_csv(\"output/middleschool.csv\")\n",
+    "middleschool_df.to_json(\"output/middleschool.json\")\n"
    ]
   },
   {
    "cell_type": "markdown",
    "metadata": {},
    "source": [
+    "Feel free to delete everything in the `data` directory after you are done\n"
    ]
   }
  ],
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
+   "version": "3.11.4"
   },
   "orig_nbformat": 4,
   "vscode": {