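"""Benchmark classifiers on the sparse 20 newsgroups dataset.

Trains each selected scikit-learn estimator, then reports training time,
prediction time, and test-set accuracy.
"""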
from __future__ import print_function, division
from time import time
import argparse
import numpy as np

from sklearn.dummy import DummyClassifier

from sklearn.datasets import fetch_20newsgroups_vectorized
from sklearn.metrics import accuracy_score
from sklearn.utils.validation import check_array

from sklearn.ensemble import RandomForestClassifier
from sklearn.ensemble import ExtraTreesClassifier
from sklearn.ensemble import AdaBoostClassifier
from sklearn.linear_model import LogisticRegression
from sklearn.naive_bayes import MultinomialNB

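# Candidate estimators, keyed by the name accepted on the command line.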
ESTIMATORS = {
    "dummy": DummyClassifier(),
    "random_forest": RandomForestClassifier(n_estimators=100,
                                            max_features="sqrt",
                                            min_samples_split=10),
    "extra_trees": ExtraTreesClassifier(n_estimators=100,
                                        max_features="sqrt",
                                        min_samples_split=10),
    "logistic_regression": LogisticRegression(),
    "naive_bayes": MultinomialNB(),
    "adaboost": AdaBoostClassifier(n_estimators=10),
}


###############################################################################
# Data

if __name__ == "__main__":

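    # Choose which estimators to run, e.g. "-e logistic_regression naive_bayes".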
    parser = argparse.ArgumentParser()
    parser.add_argument('-e', '--estimators', nargs="+", required=True,
                        choices=ESTIMATORS)
    args = vars(parser.parse_args())

    data_train = fetch_20newsgroups_vectorized(subset="train")
    data_test = fetch_20newsgroups_vectorized(subset="test")
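    # Sparse format matters here: CSC suits the column-wise access of tree
    # fitting, while CSR suits the row-wise access of prediction.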
    X_train = check_array(data_train.data, dtype=np.float32,
                          accept_sparse="csc")
    X_test = check_array(data_test.data, dtype=np.float32, accept_sparse="csr")
    y_train = data_train.target
    y_test = data_test.target

    print("20 newsgroups")
    print("=============")
    print("X_train.shape = {0}".format(X_train.shape))
    print("X_train.format = {0}".format(X_train.format))
    print("X_train.dtype = {0}".format(X_train.dtype))
    print("X_train density = {0}"
          "".format(X_train.nnz / np.prod(X_train.shape)))
    print("y_train {0}".format(y_train.shape))
    print("X_test {0}".format(X_test.shape))
    print("X_test.format = {0}".format(X_test.format))
    print("X_test.dtype = {0}".format(X_test.dtype))
    print("y_test {0}".format(y_test.shape))
    print()

    print("Classifier Training")
    print("===================")
    accuracy, train_time, test_time = {}, {}, {}
    for name in sorted(args["estimators"]):
        clf = ESTIMATORS[name]
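        # Seed estimators that support it; set_params raises for those that
        # do not (e.g. MultinomialNB), in which case seeding is skipped.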
        try:
            clf.set_params(random_state=0)
        except (TypeError, ValueError):
            pass

        print("Training %s ... " % name, end="")
        t0 = time()
        clf.fit(X_train, y_train)
        train_time[name] = time() - t0
        t0 = time()
        y_pred = clf.predict(X_test)
        test_time[name] = time() - t0
        accuracy[name] = accuracy_score(y_test, y_pred)
        print("done")

    print()
    print("Classification performance:")
    print("===========================")
    print()
    print("%s %s %s %s" % ("Classifier      ", "train-time", "test-time",
                           "Accuracy"))
    print("-" * 44)
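    # Report results from worst to best accuracy.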
    for name in sorted(accuracy, key=accuracy.get):
        print("%s %s %s %s" % (name.ljust(16),
                               ("%.4fs" % train_time[name]).center(10),
                               ("%.4fs" % test_time[name]).center(10),
                               ("%.4f" % accuracy[name]).center(10)))

    print()