import logging
from sklearn.datasets import fetch_rcv1
from sklearn.multiclass import OneVsRestClassifier
from sklearn.metrics import f1_score, precision_score, recall_score
from sklearn.pipeline import Pipeline
from sklearn import svm
# Configure the root logger with the library defaults so that warnings
# emitted below (and by imported libraries) are shown.
logging.basicConfig()

# Load the RCV1 dataset bundle through scikit-learn's fetcher.
rcv1 = fetch_rcv1()

# Number of leading rows used as the training split; every remaining row
# goes to the test split.
# NOTE(review): 23149 presumably matches the size of the official "train"
# subset documented for fetch_rcv1 -- confirm against the scikit-learn docs.
training_samples = 23149

# Positional split of the feature and target containers at the same row
# boundary, so the X/y pairs stay aligned.
X_train = rcv1.data[:training_samples]
X_test = rcv1.data[training_samples:]
y_train = rcv1.target[:training_samples]
y_test = rcv1.target[training_samples:]

# Sample IDs of the training rows only.
sample_ids = rcv1.sample_id[:training_samples]

# Sanity check on the split boundary: the last training sample ID is
# expected to be 26150. A mismatch suggests the dataset ordering differs
# from what the hard-coded `training_samples` cut-off assumes, so report it
# instead of silently training on a different split.
_expected_last_train_id = 26150
_last_train_id = sample_ids[-1]
if _last_train_id != _expected_last_train_id:
    logging.warning(
        "Unexpected last training sample id: got %s, expected %s",
        _last_train_id,
        _expected_last_train_id,
    )