openml
diff --git a/examples/OpenMLDemo.ipynb b/examples/OpenMLDemo.ipynb
Lines changed: 11 additions & 18 deletions
diff --git a/openml/datasets/dataset.py b/openml/datasets/dataset.py
Lines changed: 9 additions & 6 deletions
@@ -118,7 +118,7 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "First 10 of 2806 datasets...\n",
+      "First 10 of 2855 datasets...\n",
       "   did             name  NumberOfInstances  NumberOfFeatures\n",
       "0    1           anneal                898                39\n",
       "1    2           anneal                898                39\n",
@@ -274,6 +274,7 @@
       " 'creator': 'R.A. Fisher',\n",
       " 'data_file': '/home/andy/.openml/cache/datasets/61/dataset.arff',\n",
       " 'data_pickle_file': '/home/andy/.openml/cache/datasets/61/dataset.pkl',\n",
+      " 'dataset_id': 61,\n",
       " 'default_target_attribute': 'class',\n",
       " 'description': '**Author**: R.A. Fisher  \\n'\n",
       "                '**Source**: '\n",
@@ -304,7 +305,6 @@
       "                '       -- Iris Versicolour\\n'\n",
       "                '       -- Iris Virginica',\n",
       " 'format': 'ARFF',\n",
-      " 'id': 61,\n",
       " 'ignore_attributes': None,\n",
       " 'language': None,\n",
       " 'licence': 'Public',\n",
@@ -629,7 +629,6 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "2823\n",
       "RandomForest has run on the task.\n"
      ]
     }
@@ -657,24 +656,18 @@
    },
    "outputs": [
     {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "Uploaded run with id 538241\n",
-      "Check it at www.openml.org/r/538241\n"
-     ]
+     "data": {
+      "text/plain": [
+       "<openml.runs.run.OpenMLRun at 0x7fb31ecec668>"
+      ]
+     },
+     "execution_count": 17,
+     "metadata": {},
+     "output_type": "execute_result"
     }
    ],
    "source": [
-    "import xmltodict\n",
-    "\n",
-    "return_code, response = run.publish()\n",
-    "\n",
-    "if(return_code == 200):\n",
-    "    response_dict = xmltodict.parse(response)\n",
-    "    run_id = response_dict['oml:upload_run']['oml:run_id']\n",
-    "    print(\"Uploaded run with id %s\" % (run_id))\n",
-    "    print(\"Check it at www.openml.org/r/%s\" % (run_id))"
+    "run.publish()"
    ]
   },
   {
 
@@ -8,6 +8,7 @@
 
 import numpy as np
 import scipy.sparse
+import xmltodict
 
 if sys.version_info[0] >= 3:
     import pickle
@@ -17,6 +18,7 @@
     except:
         import pickle
 
+
 from ..util import is_string
 from .._api_calls import _perform_api_call
 
@@ -36,7 +38,7 @@ class OpenMLDataset(object):
         Description of the dataset
     FIXME : which of these do we actually need?
     """
-    def __init__(self, id=None, name=None, version=None, description=None,
+    def __init__(self, dataset_id=None, name=None, version=None, description=None,
                  format=None, creator=None, contributor=None,
                  collection_date=None, upload_date=None, language=None,
                  licence=None, url=None, default_target_attribute=None,
@@ -45,7 +47,7 @@ def __init__(self, id=None, name=None, version=None, description=None,
                  original_data_url=None, paper_url=None, update_comment=None,
                  md5_checksum=None, data_file=None):
         # Attributes received by querying the RESTful API
-        self.id = int(id) if id is not None else None
+        self.dataset_id = int(dataset_id) if dataset_id is not None else None
         self.name = name
         self.version = int(version)
         self.description = description
@@ -100,7 +102,7 @@ def __init__(self, id=None, name=None, version=None, description=None,
                 with open(self.data_pickle_file, "wb") as fh:
                     pickle.dump((X, categorical, attribute_names), fh, -1)
                 logger.debug("Saved dataset %d: %s to file %s" %
-                             (self.id, self.name, self.data_pickle_file))
+                             (self.dataset_id, self.name, self.data_pickle_file))
 
     def __eq__(self, other):
         if type(other) != OpenMLDataset:
@@ -281,7 +283,8 @@ def publish(self):
             "/data/", file_dictionary=file_dictionary,
             file_elements=file_elements)
 
-        return return_code, return_value
+        self.dataset_id = int(xmltodict.parse(return_value)['oml:upload_data_set']['oml:id'])
+        return self
 
     def _to_xml(self):
         """Serialize object to xml for upload
@@ -292,7 +295,7 @@ def _to_xml(self):
             XML description of the data.
         """
         xml_dataset = ('<oml:data_set_description '
-                       'xmlns:oml="http://openml.org/openml">')
+                       'xmlns:oml="http://openml.org/openml">\n')
         props = ['id', 'name', 'version', 'description', 'format', 'creator',
                  'contributor', 'collection_date', 'upload_date', 'language',
                  'licence', 'url', 'default_target_attribute',
@@ -302,6 +305,6 @@ def _to_xml(self):
         for prop in props:
             content = getattr(self, prop, None)
             if content is not None:
-                xml_dataset += "<oml:{0}>{1}</oml:{0}>".format(prop, content)
+                xml_dataset += "<oml:{0}>{1}</oml:{0}>\n".format(prop, content)
         xml_dataset += "</oml:data_set_description>"
         return xml_dataset