{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import sys\n",
    "sys.path.append(os.path.realpath('../..'))\n",
    "from toy.ground_truth import Ground_Truth\n",
    "from toy.data import Input_Dataset\n",
    "from toy.ntk import ReLU_NTK as NTK\n",
    "from toy.ops import f_eff_GD\n",
    "import matplotlib.pyplot as plt\n",
    "from toy.net import Net\n",
    "import torch\n",
    "import numpy as np\n",
    "import re"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Collect the epoch number of every saved student checkpoint.\n",
    "networ_dir = '../../experiment/04/network'\n",
    "\n",
    "# Checkpoint files are named 'student_epoch-<digits>'. Matching the whole\n",
    "# file name and capturing the digits means stray entries (backup copies,\n",
    "# names with a suffix, ...) are skipped instead of crashing int().\n",
    "checkpoint_pattern = re.compile(r'student_epoch-(\\d+)')\n",
    "\n",
    "epochs = []\n",
    "for s in os.listdir(networ_dir):\n",
    "    matched = checkpoint_pattern.fullmatch(s)\n",
    "    if matched:\n",
    "        epochs.append(int(matched.group(1)))\n",
    "\n",
    "# Ascending order, so an index into `epochs` selects checkpoints by epoch rank.\n",
    "epochs = np.array(sorted(epochs))\n",
    "print(epochs)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Experiment configuration, dataset and pre-trained networks.\n",
    "\n",
    "# Position in the sorted `epochs` array (not an epoch number) of the\n",
    "# student checkpoint that is used as the teacher below.\n",
    "epoch_num = 2\n",
    "# Prefer the first GPU, but fall back to the CPU so that the checkpoints can\n",
    "# still be loaded (via map_location) on a machine without CUDA.\n",
    "device = torch.device('cuda:0' if torch.cuda.is_available() else 'cpu')\n",
    "input_dim = 2\n",
    "\n",
    "# Log-spaced dataset sizes from 10 up to 10000: 100 grid points, the first one\n",
    "# dropped, truncated to integers. The upper bound is 10000.1, presumably so\n",
    "# that truncation cannot turn the last point into 9999.\n",
    "datanums = np.exp(np.linspace(np.log(10), np.log(10000.1), 100, endpoint=True))[1:].astype(int)\n",
    "\n",
    "\n",
    "# NOTE(review): loaded without map_location, so the dataset keeps whatever\n",
    "# device it was saved with - confirm before running on a CPU-only machine.\n",
    "dataset = torch.load('../../experiment/04/dataset/train_dataset')\n",
    "\n",
    "with torch.no_grad():\n",
    "    teacher_init_net = torch.load(networ_dir + '/init_net', map_location=device)\n",
    "    teacher = torch.load(networ_dir + '/student_epoch-{:06d}'.format(epochs[epoch_num]), map_location=device)\n",
    "\n",
    "# Forwarded to f_eff_GD as its `T` argument (presumably a temperature).\n",
    "T = 5.0\n",
    "# Factor applied to the teacher output before it is used as soft logits.\n",
    "teacher_reduction = 0.2\n",
    "\n",
    "# Grid of rho values, built as 1 - x with x increasing in three segments:\n",
    "#   a: 2 linearly spaced points in [0.0001, 0.01)\n",
    "#   b: 4 log-spaced points in [0.01, 0.3)\n",
    "#   c: 2 log-spaced points in [0.3, 0.99]\n",
    "a = 1 - torch.tensor(np.linspace(0.0001, 0.01, 2, endpoint=False))\n",
    "b = 1 - torch.tensor(np.exp(np.linspace(np.log(0.01), np.log(0.3), 4, endpoint=False)))\n",
    "c = 1 - torch.tensor(np.exp(np.linspace(np.log(0.3), np.log(0.99), 2, endpoint=True)))\n",
    "# c = torch.tensor([0.6, 0.5, 0.4, 0.3, 0.2, 0.1, 0.0001], dtype=torch.float64)\n",
    "rhos = torch.cat([a,b,c])\n",
    "# Number of repetitions averaged per (rho, datanum) setting.\n",
    "fold = 20\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# For every rho: mean absolute value of the regression target\n",
    "# (f_eff_GD output minus the freshly initialised network's output),\n",
    "# averaged over 5*fold runs with 10000 samples each.\n",
    "\n",
    "# Start from an empty list on every run. Without this the cell raises\n",
    "# NameError on a fresh kernel, and on a re-run `scales` would already be the\n",
    "# ndarray created at the bottom of the cell, which has no .append().\n",
    "scales = []\n",
    "\n",
    "for rho in rhos:\n",
    "    rho_scales = []\n",
    "    for i in range(5*fold):\n",
    "        with torch.no_grad():\n",
    "            # A new randomly initialised student for every repetition.\n",
    "            init_net = Net(input_dim=input_dim, output_dim=1).to(device)\n",
    "\n",
    "            dataset.datanum = 10000\n",
    "            dataset.generate_data()\n",
    "\n",
    "            # Element 1 of the dataset items is used as the network input.\n",
    "            X = dataset[:][1]\n",
    "            y = teacher_reduction * teacher(X)\n",
    "            # Hard labels are the sign of the scaled teacher output (1 where y > 0, else 0).\n",
    "            y = f_eff_GD(soft_logits=y, hard_labels=(y>0).to(y.dtype), rho=rho, T=T, iter=10000) - init_net(X)\n",
    "            scale = torch.mean(torch.abs(y))\n",
    "            rho_scales.append(scale.item())\n",
    "\n",
    "    scales.append(np.mean(np.array(rho_scales)))\n",
    "\n",
    "    print(rho.item(), scales[-1])\n",
    "\n",
    "scales = np.array(scales)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "tags": [
     "outputPrepend"
    ]
   },
   "outputs": [],
   "source": [
    "# For every (rho, datanum) pair: the quadratic form y^T Theta^{-1} y, where\n",
    "# Theta is the NTK matrix on the sampled inputs and y is the regression\n",
    "# target, averaged over `fold` repetitions.\n",
    "# Result: `data` with one row per rho and one column per entry of `datanums`.\n",
    "\n",
    "# Start from an empty list on every run. Without this the cell raises\n",
    "# NameError on a fresh kernel, and on a re-run `data` would already be the\n",
    "# ndarray created at the bottom of the cell, which has no .append().\n",
    "data = []\n",
    "\n",
    "for rho in rhos:\n",
    "    data_0 = []\n",
    "\n",
    "    for datanum in datanums:\n",
    "        data_1 = []\n",
    "\n",
    "        print(rho, datanum)\n",
    "\n",
    "        for i in range(fold):\n",
    "            with torch.no_grad():\n",
    "\n",
    "                # A new randomly initialised student for every repetition.\n",
    "                init_net = Net(input_dim=input_dim, output_dim=1).to(device)\n",
    "\n",
    "                dataset.datanum = datanum\n",
    "                dataset.generate_data()\n",
    "\n",
    "                # Element 1 of the dataset items is used as the network input.\n",
    "                X = dataset[:][1]\n",
    "                y = teacher_reduction * teacher(X)\n",
    "                y = f_eff_GD(soft_logits=y, hard_labels=(y>0).to(y.dtype), rho=rho, T=T, iter=100) - init_net(X)\n",
    "\n",
    "                Theta = NTK(X, weight_std=init_net.weight_std, bias_std=init_net.bias_std, hidden_layer_num=3)\n",
    "\n",
    "                # Solve Theta @ alpha = y. torch.solve(B, A) is deprecated and\n",
    "                # removed in recent PyTorch releases; torch.linalg.solve(A, B)\n",
    "                # is its replacement (note the reversed argument order). The\n",
    "                # legacy call is kept as a fallback for old installations.\n",
    "                if hasattr(torch, 'linalg') and hasattr(torch.linalg, 'solve'):\n",
    "                    alpha = torch.linalg.solve(Theta, y)\n",
    "                else:\n",
    "                    alpha, _ = torch.solve(y, Theta)\n",
    "                result = torch.dot(y.squeeze(), alpha.squeeze()).item()\n",
    "\n",
    "            # Keep only finite, strictly positive values (NaN fails the > 0\n",
    "            # test); anything else is presumably a numerical failure of the solve.\n",
    "            if not np.isinf(result):\n",
    "                if result > 0:\n",
    "                    data_1.append(result)\n",
    "\n",
    "        data_0.append(np.mean(np.array(data_1)))\n",
    "\n",
    "    data.append(np.array(data_0))\n",
    "\n",
    "data = np.array(data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Persist the results of the two sweeps above.\n",
    "out_dir = '../../experiment/04c'\n",
    "# exist_ok=True creates the directory if needed, without a separate\n",
    "# check-then-create step.\n",
    "os.makedirs(out_dir, exist_ok=True)\n",
    "\n",
    "# `data` and `scales` are NumPy arrays here; torch.save pickles them, so\n",
    "# they are meant to be read back with torch.load.\n",
    "torch.save(data, out_dir + '/data')\n",
    "torch.save(scales, out_dir + '/scales')"
   ]
  }
 ],
 "metadata": {
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.3-final"
  },
  "orig_nbformat": 2,
  "kernelspec": {
   "name": "python38364bit5172cfd22f324156974f51e47e17b07a",
   "display_name": "Python 3.8.3 64-bit"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}