|
3 | 3 | { |
4 | 4 | "cell_type": "code", |
5 | 5 | "execution_count": null, |
6 | | - "id": "micro-minneapolis", |
7 | 6 | "metadata": {}, |
8 | 7 | "outputs": [], |
9 | 8 | "source": [ |
10 | 9 | "import kessler\n", |
11 | 10 | "from kessler import EventDataset\n", |
12 | 11 | "from kessler.nn import LSTMPredictor\n", |
13 | 12 | "from kessler.data import kelvins_to_event_dataset\n", |
| 13 | + "import pandas as pd\n", |
14 | 14 | "\n", |
15 | | - "import pandas as pd" |
| 15 | + "# Set the random number generator seed for reproducibility\n", |
| 16 | + "kessler.seed(1)" |
16 | 17 | ] |
17 | 18 | }, |
18 | 19 | { |
19 | 20 | "cell_type": "markdown", |
20 | | - "id": "flexible-algorithm", |
21 | 21 | "metadata": {}, |
22 | 22 | "source": [ |
23 | 23 | "# Data Loading\n", |
|
28 | 28 | { |
29 | 29 | "cell_type": "code", |
30 | 30 | "execution_count": null, |
31 | | - "id": "ahead-beach", |
32 | 31 | "metadata": {}, |
33 | 32 | "outputs": [], |
34 | 33 | "source": [ |
35 | 34 | "#As an example, we first show the case in which the data comes from the Kelvins competition.\n", |
36 | 35 | "#For this, we built a specific converter that takes care of the conversion from Kelvins format\n", |
37 | 36 | "#to standard CDM format (the data can be downloaded at https://kelvins.esa.int/collision-avoidance-challenge/data/):\n", |
38 | | - "file_name = 'path_to_csv/train_data.csv'\n", |
39 | | - "events = kelvins_to_event_dataset(file_name, drop_features=['c_rcs_estimate', 't_rcs_estimate'], num_events=200) #we use only 200 events" |
| 37 | + "file_name = '/home/gunes/data/kelvins/train_data/train_data.csv'\n", |
| 38 | + "events = kelvins_to_event_dataset(file_name, drop_features=['c_rcs_estimate', 't_rcs_estimate'], num_events=1000) #we use only 1000 events"
40 | 39 | ] |
41 | 40 | }, |
42 | 41 | { |
43 | 42 | "cell_type": "code", |
44 | 43 | "execution_count": null, |
45 | | - "id": "formed-recognition", |
46 | 44 | "metadata": {}, |
47 | 45 | "outputs": [], |
48 | 46 | "source": [ |
|
55 | 53 | }, |
56 | 54 | { |
57 | 55 | "cell_type": "markdown", |
58 | | - "id": "weekly-baltimore", |
59 | 56 | "metadata": {}, |
60 | 57 | "source": [ |
61 | 58 | "# Descriptive Statistics" |
|
64 | 61 | { |
65 | 62 | "cell_type": "code", |
66 | 63 | "execution_count": null, |
67 | | - "id": "demonstrated-clothing", |
68 | 64 | "metadata": {}, |
69 | 65 | "outputs": [], |
70 | 66 | "source": [ |
|
75 | 71 | }, |
76 | 72 | { |
77 | 73 | "cell_type": "markdown", |
78 | | - "id": "upper-columbus", |
79 | 74 | "metadata": {}, |
80 | 75 | "source": [ |
81 | 76 | "# LSTM Training" |
|
84 | 79 | { |
85 | 80 | "cell_type": "code", |
86 | 81 | "execution_count": null, |
87 | | - "id": "intense-massage", |
88 | 82 | "metadata": {}, |
89 | 83 | "outputs": [], |
90 | 84 | "source": [ |
|
98 | 92 | { |
99 | 93 | "cell_type": "code", |
100 | 94 | "execution_count": null, |
101 | | - "id": "norman-value", |
102 | 95 | "metadata": {}, |
103 | 96 | "outputs": [], |
104 | 97 | "source": [ |
|
117 | 110 | { |
118 | 111 | "cell_type": "code", |
119 | 112 | "execution_count": null, |
120 | | - "id": "corporate-gardening", |
121 | 113 | "metadata": {}, |
122 | 114 | "outputs": [], |
123 | 115 | "source": [ |
124 | 116 | "# Create an LSTM predictor, specialized to the nn_features we extracted above\n", |
125 | | - "model = LSTMPredictor(features=nn_features)\n", |
| 117 | + "model = LSTMPredictor(\n", |
| 118 | + " lstm_size=256, # Number of hidden units per LSTM layer\n", |
| 119 | + " lstm_depth=2, # Number of stacked LSTM layers\n", |
| 120 | + " dropout=0.2, # Dropout probability\n", |
| 121 | + " features=nn_features) # The list of feature names to use in the LSTM\n", |
126 | 122 | "\n", |
127 | 123 | "# Start training\n", |
128 | 124 | "model.learn(events_train_and_val, \n", |
129 | | - " epochs=3, # Number of epochs (one epoch is one full pass through the training dataset)\n", |
130 | | - " lr=1e-4, # Learning rate, can decrease it if training diverges\n", |
| 125 | + " epochs=10, # Number of epochs (one epoch is one full pass through the training dataset)\n", |
| 126 | + " lr=1e-3, # Learning rate, can decrease it if training diverges\n", |
131 | 127 | " batch_size=16, # Minibatch size, can be decreased if there are issues with memory use\n", |
132 | 128 | " device='cpu', # Can be 'cuda' if there is a GPU available\n", |
133 | 129 | " valid_proportion=0.15, # Proportion of the data to use as a validation set internally\n", |
|
138 | 134 | { |
139 | 135 | "cell_type": "code", |
140 | 136 | "execution_count": null, |
141 | | - "id": "egyptian-yemen", |
142 | 137 | "metadata": {}, |
143 | 138 | "outputs": [], |
144 | 139 | "source": [ |
|
149 | 144 | { |
150 | 145 | "cell_type": "code", |
151 | 146 | "execution_count": null, |
152 | | - "id": "alert-furniture", |
153 | 147 | "metadata": {}, |
154 | 148 | "outputs": [], |
155 | 149 | "source": [ |
|
160 | 154 | { |
161 | 155 | "cell_type": "code", |
162 | 156 | "execution_count": null, |
163 | | - "id": "compressed-democracy", |
164 | 157 | "metadata": {}, |
165 | 158 | "outputs": [], |
166 | 159 | "source": [ |
|
171 | 164 | { |
172 | 165 | "cell_type": "code", |
173 | 166 | "execution_count": null, |
174 | | - "id": "contemporary-professional", |
175 | 167 | "metadata": {}, |
176 | 168 | "outputs": [], |
177 | 169 | "source": [ |
|
187 | 179 | { |
188 | 180 | "cell_type": "code", |
189 | 181 | "execution_count": null, |
190 | | - "id": "collected-chaos", |
191 | 182 | "metadata": {}, |
192 | 183 | "outputs": [], |
193 | 184 | "source": [ |
|
200 | 191 | { |
201 | 192 | "cell_type": "code", |
202 | 193 | "execution_count": null, |
203 | | - "id": "grateful-billion", |
204 | 194 | "metadata": {}, |
205 | 195 | "outputs": [], |
206 | 196 | "source": [ |
207 | 197 | "#we now plot the uncertainty prediction for all the covariance matrix elements of both OBJECT1 and OBJECT2:\n", |
208 | 198 | "axs = event_evolution.plot_uncertainty(return_axs=True, linewidth=0.5, label='Prediction', alpha=0.5, color='red', legend=True, diagonal=False)\n", |
209 | 199 | "event.plot_uncertainty(axs=axs, label='Real', diagonal=False)" |
210 | 200 | ] |
211 | | - }, |
212 | | - { |
213 | | - "cell_type": "markdown", |
214 | | - "id": "graphic-impression", |
215 | | - "metadata": {}, |
216 | | - "source": [ |
217 | | - "# Plotting loop over all the events & CDMs\n", |
218 | | - "You can here customize the features to be plotted: we use relative speed, miss distance, and a covariance value:" |
219 | | - ] |
220 | | - }, |
221 | | - { |
222 | | - "cell_type": "code", |
223 | | - "execution_count": null, |
224 | | - "id": "going-memory", |
225 | | - "metadata": {}, |
226 | | - "outputs": [], |
227 | | - "source": [ |
228 | | - "#we loop over the test set events:\n", |
229 | | - "predict_full_event=False\n", |
230 | | - "for i in range(0,len(events_test)):\n", |
231 | | - " event=events_test[i]\n", |
232 | | - " len_ev=len(event)\n", |
233 | | - " for j in range(1,len_ev):\n", |
234 | | - " #print(j)\n", |
235 | | - " if predict_full_event:\n", |
236 | | - " event_evolution = model.predict_event(event[0:j],num_samples=10)\n", |
237 | | - " else:\n", |
238 | | - " event_evolution = model.predict_event_step(event[0:j],num_samples=10)\n", |
239 | | - "\n", |
240 | | - " #we plot the features (ground truth & prediction)\n", |
241 | | - " axs_1 = event_evolution.plot_features(['RELATIVE_SPEED', 'MISS_DISTANCE', 'OBJECT1_CT_T'], return_axs=True, linewidth=0.1, color='red', alpha=0.33, label='Prediction')\n", |
242 | | - " event.plot_features(['RELATIVE_SPEED', 'MISS_DISTANCE', 'OBJECT1_CT_T'], axs=axs_1, label='Real', legend=True,file_name=f'features_event_{i}_cdm_{j}.pdf')\n", |
243 | | - " #we plot the uncertainties (ground truth & prediction)\n", |
244 | | - " axs_2 = event_evolution.plot_uncertainty(return_axs=True, linewidth=0.5, label='Prediction', alpha=0.5, color='red', legend=True, diagonal=False)\n", |
245 | | - " event.plot_uncertainty(axs=axs_2, label='Real', diagonal=False, file_name=f'uncertainties_event_{i}_cdm_{j}.pdf')" |
246 | | - ] |
247 | | - }, |
248 | | - { |
249 | | - "cell_type": "markdown", |
250 | | - "id": "actual-effectiveness", |
251 | | - "metadata": {}, |
252 | | - "source": [ |
253 | | - "# Training set test\n", |
254 | | - "We check if the model is able to predict the CDMs on the training set" |
255 | | - ] |
256 | | - }, |
257 | | - { |
258 | | - "cell_type": "code", |
259 | | - "execution_count": null, |
260 | | - "id": "enclosed-europe", |
261 | | - "metadata": {}, |
262 | | - "outputs": [], |
263 | | - "source": [ |
264 | | - "\n", |
265 | | - "#we loop over some training set events, to check the NN performances:\n", |
266 | | - "num_events=10\n", |
267 | | - "for i in range(0,num_events):\n", |
268 | | - " event=events_train_and_val[i]\n", |
269 | | - " len_ev=len(event)\n", |
270 | | - " for j in range(1,len_ev):\n", |
271 | | - " print(j)\n", |
272 | | - " event_evolution = model.predict_event(event[0:j],num_samples=10)\n", |
273 | | - " #we plot the features (ground truth & prediction)\n", |
274 | | - " axs_1 = event_evolution.plot_features(['RELATIVE_SPEED', 'MISS_DISTANCE', 'OBJECT1_CT_T'], return_axs=True, linewidth=0.1, color='red', alpha=0.33, label='Prediction')\n", |
275 | | - " event.plot_features(['RELATIVE_SPEED', 'MISS_DISTANCE', 'OBJECT1_CT_T'], axs=axs_1, label='Real', legend=True,file_name=f'training_set_features_event_{i}_cdm_{j}.pdf')\n", |
276 | | - " #we plot the uncertainties (ground truth & prediction)\n", |
277 | | - " axs_2 = event_evolution.plot_uncertainty(return_axs=True, linewidth=0.5, label='Prediction', alpha=0.5, color='red', legend=True, diagonal=False)\n", |
278 | | - " event.plot_uncertainty(axs=axs_2, label='Real', diagonal=False, file_name=f'training_set_uncertainties_event_{i}_cdm_{j}.pdf')" |
279 | | - ] |
280 | 201 | } |
281 | 202 | ], |
282 | 203 | "metadata": { |
|
295 | 216 | "name": "python", |
296 | 217 | "nbconvert_exporter": "python", |
297 | 218 | "pygments_lexer": "ipython3", |
298 | | - "version": "3.7.9" |
| 219 | + "version": "3.8.5" |
299 | 220 | } |
300 | 221 | }, |
301 | 222 | "nbformat": 4, |
|
0 commit comments