ķ
\c           @   sĒ   d  Z  d d l Z d d l j Z d d l Z d d l m Z d d l	 m
 Z
 d d l m Z d d l m Z d d l m Z d d l m Z d d	 l m Z d
   Z d S(   sO   Test the rcv1 loader.

Skipped if rcv1 is not already downloaded to data_home.
i˙˙˙˙N(   t   partial(   t
   fetch_rcv1(   t   check_return_X_y(   t   assert_almost_equal(   t   assert_array_equal(   t   assert_equal(   t   SkipTestc       	   C   sđ  y t  d t d t  }  Wn4 t k
 rO } | j t j k rP t d   qP n X|  j |  j } } |  j j	   |  j
 } } t j |  s t  t j |  sĻ t  t d | j j  t d | j j  t d | j  t d | j  t d  | j  t d t |   d	 d
 d d d d g } t | | d   d! } d" } xO t | |  D]> \ }	 }
 | j |
  } t |	 | d  d   | f j j  qTWt  d t d d d d d t  } | j | j } } | j
 } t t  d t d d d t } t | |  t t j | d   t j |   d# } xÂ | D]ē } | j	   j |  } | j	   j |  } | | d  d   f j   } | | d  d   f j   } t | |  | | d  d   f j   } | | d  d   f j   } t | |  q.Wd  S($   Nt   shufflet   download_if_missings'   Download RCV1 dataset to run this test.iŠ}ĄiĮ' i>F i¸  ig   u   C11u   C12u   C13u   C14u   C15u   C151i   t   GMILt   E143t   CCATi   iļ  iŅ t   subsett   traint   random_stateiM   imZ  iî  iĘ  iÚ6  (   i>F i¸  (   i>F ig   (   i>F (   R	   R
   R   (   i   iļ  iŅ (   iî  iĘ  iÚ6  (   R   t   Falset   IOErrort   errnot   ENOENTR   t   datat   targett   target_namest   tolistt	   sample_idt   spt   issparset   AssertionErrorR   t   sizet   shapet   lenR   t   zipt   indext   TrueR    R   t   npt   sortt   toarrayR   (   t   data1t   et   X1t   Y1t   cat_listt   s1t   first_categoriest   some_categoriest   number_non_zero_in_catt   numt   catt   jt   data2t   X2t   Y2t   s2t
   fetch_funct   some_sample_idsR   t   idx1t   idx2t   feature_values_1t   feature_values_2t   target_values_1t   target_values_2(    (    s?   lib/python2.7/site-packages/sklearn/datasets/tests/test_rcv1.pyt   test_fetch_rcv1   sP    '			#(   t   __doc__R   t   scipy.sparset   sparseR   t   numpyR!   t	   functoolsR    t   sklearn.datasetsR   t"   sklearn.datasets.tests.test_commonR   t   sklearn.utils.testingR   R   R   R   R<   (    (    (    s?   lib/python2.7/site-packages/sklearn/datasets/tests/test_rcv1.pyt   <module>   s   