X.shape = (5000, 15)
y.shape = (5000,)
X_train_tf,X_test_tf, y_train_tf, y_test_tf = train_test_split(final,duplicate, stratify=y_true, test_size=0.3,random_state=13)
Ошибка (Error):
---------------------------------------------------------------------------
ValueError Traceback (most recent call last)
<ipython-input-117-3e272bbb265d> in <module>
----> 1 X_train_tf,X_test_tf, y_train_tf, y_test_tf = train_test_split(final,duplicate, stratify=y_true, test_size=0.3,random_state=13)
D:\Anaconda\lib\site-packages\sklearn\model_selection\_split.py in train_test_split(*arrays, **options)
2141 random_state=random_state)
2142
-> 2143 train, test = next(cv.split(X=arrays[0], y=stratify))
2144
2145 return list(chain.from_iterable((_safe_indexing(a, train),
D:\Anaconda\lib\site-packages\sklearn\model_selection\_split.py in split(self, X, y, groups)
1326 to an integer.
1327 """
-> 1328 X, y, groups = indexable(X, y, groups)
1329 for train, test in self._iter_indices(X, y, groups):
1330 yield train, test
D:\Anaconda\lib\site-packages\sklearn\utils\validation.py in indexable(*iterables)
246 """
247 result = [_make_indexable(X) for X in iterables]
--> 248 check_consistent_length(*result)
249 return result
250
D:\Anaconda\lib\site-packages\sklearn\utils\validation.py in check_consistent_length(*arrays)
210 if len(uniques) > 1:
211 raise ValueError("Found input variables with inconsistent numbers of"
--> 212 " samples: %r" % [int(l) for l in lengths])
213
214
ValueError: Found input variables with inconsistent numbers of samples: [404290, 100000]