{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# IMDB-WIKI Knowledge Graph\n", "\n", "- Convert names to Knowledge Graph entity IDs.\n", "- The `imdb.mat` file contains only full names, but we need KG IDs of the form `/m/12345`." ] }, { "cell_type": "code", "execution_count": 87, "metadata": {}, "outputs": [], "source": [ "%reload_ext autoreload\n", "%autoreload 2\n", "\n", "import os\n", "import os.path as osp\n", "from os.path import join\n", "from glob import glob\n", "from pathlib import Path\n", "import random\n", "import math\n", "from datetime import datetime\n", "import requests\n", "import json\n", "import time\n", "from pprint import pprint\n", "from multiprocessing.pool import ThreadPool\n", "import threading\n", "import urllib.request\n", "\n", "from tqdm import tqdm_notebook as tqdm\n", "import pandas as pd\n", "from scipy.io import loadmat\n", "import numpy as np\n", "%matplotlib inline\n", "import matplotlib.pyplot as plt" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Load IMDB Metadata" ] }, { "cell_type": "code", "execution_count": 13, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
| \n", " | celeb_id | \n", "dob | \n", "filepath | \n", "gender | \n", "name | \n", "x1 | \n", "x2 | \n", "y1 | \n", "y2 | \n", "year_photo | \n", "
|---|---|---|---|---|---|---|---|---|---|---|
| index | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
| 0 | \n", "6488 | \n", "1900-5-11 | \n", "01/nm0000001_rm124825600_1899-5-10_1968.jpg | \n", "m | \n", "Fred Astaire | \n", "1072.926 | \n", "1214.784 | \n", "161.838 | \n", "303.696 | \n", "1968 | \n", "
| 1 | \n", "6488 | \n", "1900-5-11 | \n", "01/nm0000001_rm3343756032_1899-5-10_1970.jpg | \n", "m | \n", "Fred Astaire | \n", "477.184 | \n", "622.592 | \n", "100.352 | \n", "245.760 | \n", "1970 | \n", "