linted

jnolis · jnolis · commit cc2cbe5a2491 · 2021-03-17T14:44:01.000-07:00
diff --git a/examples/pytorch/01-start-with-pytorch.ipynb b/examples/pytorch/01-start-with-pytorch.ipynb
@@ -28,18 +28,16 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "import pandas as pd\n",
-    "import uuid\n",
+    "import uuid # noqa\n",
     "import datetime\n",
-    "import pickle\n",
+    "import pickle # noqa\n",
     "import json\n",
-    "import torch\n",
-    "import math\n",
+    "import torch # noqa\n",
     "import torch.nn as nn\n",
     "import torch.optim as optim\n",
     "import numpy as np\n",
     "import urllib.request\n",
-    "import time\n",
+    "import pandas as pd # noqa\n",
     "from torch.utils.data import Dataset, DataLoader"
    ]
   },
@@ -65,44 +63,47 @@
     "characters = list(\"*+abcdefghijklmnopqrstuvwxyz-. \")\n",
     "str_len = 8\n",
     "\n",
+    "\n",
     "def format_training_data(pet_names, device=None):\n",
     "    def get_substrings(in_str):\n",
     "        # add the stop character to the end of the name, then generate all the partial names\n",
     "        in_str = in_str + \"+\"\n",
     "        res = [in_str[0: j] for j in range(1, len(in_str) + 1)]\n",
     "        return res\n",
-    "    pet_names_expanded = [get_substrings(name) for name in  pet_names]\n",
+    "    pet_names_expanded = [get_substrings(name) for name in pet_names]\n",
     "    pet_names_expanded = [item for sublist in pet_names_expanded for item in sublist]\n",
     "    pet_names_characters = [list(name) for name in pet_names_expanded]\n",
     "    pet_names_padded = [name[-(str_len + 1):] for name in pet_names_characters]\n",
-    "    pet_names_padded = [list((str_len + 1- len(characters)) * \"*\") + characters for characters in pet_names_padded]\n",
+    "    pet_names_padded = [list((str_len + 1 - len(characters)) * \"*\") + characters for characters in pet_names_padded]\n",
     "    pet_names_numeric = [[characters.index(char) for char in name] for name in pet_names_padded]\n",
     "\n",
     "    # the final x and y data to use for training the model. Note that the x data needs to be one-hot encoded\n",
     "    if device is None:\n",
     "        y = torch.tensor([name[1:] for name in pet_names_numeric])\n",
     "        x = torch.tensor([name[:-1] for name in pet_names_numeric])\n",
     "    else:\n",
-    "        y = torch.tensor([name[1:] for name in pet_names_numeric], device = device)\n",
-    "        x = torch.tensor([name[:-1] for name in pet_names_numeric], device = device)\n",
-    "    x = torch.nn.functional.one_hot(x, num_classes = len(characters)).float()\n",
+    "        y = torch.tensor([name[1:] for name in pet_names_numeric], device=device)\n",
+    "        x = torch.tensor([name[:-1] for name in pet_names_numeric], device=device)\n",
+    "    x = torch.nn.functional.one_hot(x, num_classes=len(characters)).float()\n",
     "    return x, y\n",
     "\n",
+    "\n",
     "class OurDataset(Dataset):\n",
     "    def __init__(self, pet_names, device=None):\n",
     "        self.x, self.y = format_training_data(pet_names, device)\n",
     "        self.permute()\n",
-    "        \n",
+    "\n",
     "    def __getitem__(self, idx):\n",
     "        idx = self.permutation[idx]\n",
     "        return self.x[idx], self.y[idx]\n",
-    "    \n",
+    "\n",
     "    def __len__(self):\n",
     "        return len(self.x)\n",
-    "    \n",
+    "\n",
     "    def permute(self):\n",
     "        self.permutation = torch.randperm(len(self.x))\n",
     "\n",
+    "\n",
     "class Model(nn.Module):\n",
     "    def __init__(self):\n",
     "        super(Model, self).__init__()\n",
@@ -115,6 +116,7 @@
     "            dropout=0.1,\n",
     "        )\n",
     "        self.fc = nn.Linear(self.lstm_size, len(characters))\n",
+    "\n",
     "    def forward(self, x):\n",
     "        output, state = self.lstm(x)\n",
     "        logits = self.fc(output)\n",
@@ -138,21 +140,21 @@
     "def train():\n",
     "    device = torch.device(0)\n",
     "\n",
-    "    dataset = OurDataset(pet_names, device = device)\n",
-    "    loader = DataLoader(dataset, batch_size=batch_size,shuffle=True, num_workers=0)\n",
-    "    \n",
+    "    dataset = OurDataset(pet_names, device=device)\n",
+    "    loader = DataLoader(dataset, batch_size=batch_size, shuffle=True, num_workers=0)\n",
+    "\n",
     "    model = Model()\n",
     "    model = model.to(device)\n",
-    "    \n",
+    "\n",
     "    criterion = nn.CrossEntropyLoss()\n",
     "    optimizer = optim.Adam(model.parameters(), lr=0.001)\n",
-    "    \n",
+    "\n",
     "    for epoch in range(num_epochs):\n",
     "        dataset.permute()\n",
     "        for i, (batch_x, batch_y) in enumerate(loader):\n",
     "            optimizer.zero_grad()\n",
     "            batch_y_pred = model(batch_x)\n",
-    "            \n",
+    "\n",
     "            loss = criterion(batch_y_pred.transpose(1, 2), batch_y)\n",
     "            loss.backward()\n",
     "            optimizer.step()\n",
@@ -206,21 +208,21 @@
     "        in_progress_name_padded = in_progress_name[-str_len:]\n",
     "        in_progress_name_padded = list((str_len - len(in_progress_name_padded)) * \"*\") + in_progress_name_padded\n",
     "        in_progress_name_numeric = [characters.index(char) for char in in_progress_name_padded]\n",
-    "        in_progress_name_tensor = torch.tensor(in_progress_name_numeric, device = device)\n",
-    "        in_progress_name_tensor = torch.nn.functional.one_hot(in_progress_name_tensor, num_classes = len(characters)).float()\n",
+    "        in_progress_name_tensor = torch.tensor(in_progress_name_numeric, device=device)\n",
+    "        in_progress_name_tensor = torch.nn.functional.one_hot(in_progress_name_tensor, num_classes=len(characters)).float()\n",
     "        in_progress_name_tensor = torch.unsqueeze(in_progress_name_tensor, 0)\n",
-    "        \n",
+    "\n",
     "        # get the probabilities of each possible next character by running the model\n",
     "        with torch.no_grad():\n",
     "            next_letter_probabilities = model(in_progress_name_tensor)\n",
-    "        \n",
-    "        next_letter_probabilities = next_letter_probabilities[0,-1,:]\n",
+    "\n",
+    "        next_letter_probabilities = next_letter_probabilities[0, -1, :]\n",
     "        next_letter_probabilities = torch.nn.functional.softmax(next_letter_probabilities, dim=0).detach().cpu().numpy()\n",
     "        next_letter_probabilities = next_letter_probabilities[1:]\n",
-    "        next_letter_probabilities = [p/sum(next_letter_probabilities) for p in next_letter_probabilities]\n",
-    "        \n",
+    "        next_letter_probabilities = [p / sum(next_letter_probabilities) for p in next_letter_probabilities]\n",
+    "\n",
     "        # determine what the actual letter is\n",
-    "        next_letter = characters[np.random.choice(len(characters)-1, p=next_letter_probabilities) + 1]\n",
+    "        next_letter = characters[np.random.choice(len(characters) - 1, p=next_letter_probabilities) + 1]\n",
     "        if(next_letter != \"+\"):\n",
     "            # if the next character isn't stop add the latest generated character to the name and continue\n",
     "            in_progress_name.append(next_letter)\n",
@@ -243,7 +245,7 @@
    "outputs": [],
    "source": [
     "# Generate 50 names then filter out existing ones\n",
-    "generated_names = [generate_name(model, characters, str_len) for i in range(0,50)]\n",
+    "generated_names = [generate_name(model, characters, str_len) for i in range(0, 50)]\n",
     "generated_names = [name for name in generated_names if name not in pet_names]\n",
     "print(generated_names)"
    ]
diff --git a/examples/pytorch/02-start-with-dask.ipynb b/examples/pytorch/02-start-with-dask.ipynb
@@ -47,7 +47,7 @@
    "source": [
     "@dask.delayed\n",
     "def lazy_exponent(args):\n",
-    "    x,y = args\n",
+    "    x, y = args\n",
     "    '''Define a lazily evaluating function'''\n",
     "    return x ** y"
    ]
@@ -65,7 +65,7 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "inputs = [[1,2], [3,4], [5,6], [9, 10], [11, 12]]\n",
+    "inputs = [[1, 2], [3, 4], [5, 6], [9, 10], [11, 12]]\n",
     "\n",
     "example_future = client.map(lazy_exponent, inputs)\n",
     "futures_gathered = client.gather(example_future)\n",
diff --git a/examples/pytorch/03-start-with-pytorch-dask-multiple-models.ipynb b/examples/pytorch/03-start-with-pytorch-dask-multiple-models.ipynb
@@ -22,18 +22,16 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "import pandas as pd\n",
-    "import uuid\n",
-    "import datetime\n",
-    "import pickle\n",
-    "import json\n",
-    "import torch\n",
-    "import math\n",
-    "import torch.nn as nn\n",
-    "import torch.optim as optim\n",
-    "import numpy as np\n",
-    "import urllib.request\n",
-    "import time\n",
+    "import uuid # noqa\r\n",
+    "import datetime\r\n",
+    "import pickle # noqa\r\n",
+    "import json\r\n",
+    "import torch\r\n",
+    "import torch.nn as nn\r\n",
+    "import torch.optim as optim\r\n",
+    "import numpy as np # noqa\r\n",
+    "import urllib.request\r\n",
+    "import pandas as pd\r\n",
     "from torch.utils.data import Dataset, DataLoader"
    ]
   },
@@ -52,44 +50,47 @@
     "characters = list(\"*+abcdefghijklmnopqrstuvwxyz-. \")\n",
     "str_len = 8\n",
     "\n",
+    "\n",
     "def format_training_data(pet_names, device=None):\n",
     "    def get_substrings(in_str):\n",
     "        # add the stop character to the end of the name, then generate all the partial names\n",
     "        in_str = in_str + \"+\"\n",
     "        res = [in_str[0: j] for j in range(1, len(in_str) + 1)]\n",
     "        return res\n",
-    "    pet_names_expanded = [get_substrings(name) for name in  pet_names]\n",
+    "    pet_names_expanded = [get_substrings(name) for name in pet_names]\n",
     "    pet_names_expanded = [item for sublist in pet_names_expanded for item in sublist]\n",
     "    pet_names_characters = [list(name) for name in pet_names_expanded]\n",
     "    pet_names_padded = [name[-(str_len + 1):] for name in pet_names_characters]\n",
-    "    pet_names_padded = [list((str_len + 1- len(characters)) * \"*\") + characters for characters in pet_names_padded]\n",
+    "    pet_names_padded = [list((str_len + 1 - len(characters)) * \"*\") + characters for characters in pet_names_padded]\n",
     "    pet_names_numeric = [[characters.index(char) for char in name] for name in pet_names_padded]\n",
     "\n",
     "    # the final x and y data to use for training the model. Note that the x data needs to be one-hot encoded\n",
     "    if device is None:\n",
     "        y = torch.tensor([name[1:] for name in pet_names_numeric])\n",
     "        x = torch.tensor([name[:-1] for name in pet_names_numeric])\n",
     "    else:\n",
-    "        y = torch.tensor([name[1:] for name in pet_names_numeric], device = device)\n",
-    "        x = torch.tensor([name[:-1] for name in pet_names_numeric], device = device)\n",
-    "    x = torch.nn.functional.one_hot(x, num_classes = len(characters)).float()\n",
+    "        y = torch.tensor([name[1:] for name in pet_names_numeric], device=device)\n",
+    "        x = torch.tensor([name[:-1] for name in pet_names_numeric], device=device)\n",
+    "    x = torch.nn.functional.one_hot(x, num_classes=len(characters)).float()\n",
     "    return x, y\n",
     "\n",
+    "\n",
     "class OurDataset(Dataset):\n",
     "    def __init__(self, pet_names, device=None):\n",
     "        self.x, self.y = format_training_data(pet_names, device)\n",
     "        self.permute()\n",
-    "        \n",
+    "\n",
     "    def __getitem__(self, idx):\n",
     "        idx = self.permutation[idx]\n",
     "        return self.x[idx], self.y[idx]\n",
-    "    \n",
+    "\n",
     "    def __len__(self):\n",
     "        return len(self.x)\n",
-    "    \n",
+    "\n",
     "    def permute(self):\n",
     "        self.permutation = torch.randperm(len(self.x))\n",
     "\n",
+    "\n",
     "class Model(nn.Module):\n",
     "    def __init__(self):\n",
     "        super(Model, self).__init__()\n",
@@ -102,6 +103,7 @@
     "            dropout=0.1,\n",
     "        )\n",
     "        self.fc = nn.Linear(self.lstm_size, len(characters))\n",
+    "\n",
     "    def forward(self, x):\n",
     "        output, state = self.lstm(x)\n",
     "        logits = self.fc(output)\n",
@@ -162,28 +164,27 @@
     "    training_start_time = datetime.datetime.now()\n",
     "    device = torch.device(0)\n",
     "\n",
-    "    dataset = OurDataset(pet_names, device = device)\n",
+    "    dataset = OurDataset(pet_names, device=device)\n",
     "    loader = DataLoader(dataset, batch_size=batch_size, shuffle=True, num_workers=0)\n",
-    "    \n",
+    "\n",
     "    model = Model()\n",
     "    model = model.to(device)\n",
-    "    \n",
+    "\n",
     "    criterion = nn.CrossEntropyLoss()\n",
     "    optimizer = optim.Adam(model.parameters(), lr=lr)\n",
-    "    \n",
+    "\n",
     "    results = []\n",
     "\n",
     "    for epoch in range(num_epochs):\n",
     "        dataset.permute()\n",
     "        for i, (batch_x, batch_y) in enumerate(loader):\n",
     "            optimizer.zero_grad()\n",
     "            batch_y_pred = model(batch_x)\n",
-    "            \n",
+    "\n",
     "            loss = criterion(batch_y_pred.transpose(1, 2), batch_y)\n",
     "            loss.backward()\n",
     "            optimizer.step()\n",
     "            logger.info(f\"{datetime.datetime.now().isoformat()} - batch {i} - batch_size {batch_size} - lr {lr} - epoch {epoch} complete - loss {loss.item()}\")\n",
-    "        epoch_end_time = datetime.datetime.now().isoformat()\n",
     "        new_results = {\n",
     "            \"batch_size\": batch_size,\n",
     "            \"lr\": lr,\n",
@@ -210,7 +211,7 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "inputs = [(4096,0.001), (16384, 0.001), (4096,0.01), (16384, 0.01)]\n",
+    "inputs = [(4096, 0.001), (16384, 0.001), (4096, 0.01), (16384, 0.01)]\n",
     "\n",
     "train_future = client.map(train, inputs)\n",
     "futures_gathered = client.gather(train_future)\n",
diff --git a/examples/pytorch/04-start-with-pytorch-dask-single-model.ipynb b/examples/pytorch/04-start-with-pytorch-dask-single-model.ipynb