diff --git a/sklearn/cluster/tests/test_hierarchical.py b/sklearn/cluster/tests/test_hierarchical.py
index 2121eef7d416577767d223c247c0aefe817264c6..8c4f06598bae38db622cccc2801290bb8e512d3e 100644
--- a/sklearn/cluster/tests/test_hierarchical.py
+++ b/sklearn/cluster/tests/test_hierarchical.py
@@ -87,6 +87,8 @@ def test_ward_clustering():
     clustering.fit(X)
     labels = clustering.labels_
     assert_true(np.size(np.unique(labels)) == 10)
+    # Turn caching off: rebuild the estimator without a `memory` argument
+    clustering = Ward(n_clusters=10, connectivity=connectivity)
     # Check that we obtain the same solution with early-stopping of the
     # tree building
     clustering.compute_full_tree = False