Merge pull request #103 from nyanp/bugfix/fix-ci-errors

Fix CI errors; closes #101 and #102
bugfix/flake8
nyanp 2023-07-11 00:27:14 +09:00 committed by GitHub
commit 44b0169e4e
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
3 changed files with 3 additions and 3 deletions

View File

@@ -174,7 +174,7 @@ class TargetEncoder(KFoldEncoderWrapper):
groups: Optional[pd.Series] = None,
cols: List[str] = None,
drop_invariant: bool = False, handle_missing: str = 'value', handle_unknown: str = 'value',
min_samples_leaf: int = 1, smoothing: float = 1.0, return_same_type: bool = True):
min_samples_leaf: int = 20, smoothing: float = 10.0, return_same_type: bool = True):
e = ce.TargetEncoder(cols=cols, drop_invariant=drop_invariant, return_df=True,
handle_missing=handle_missing,
handle_unknown=handle_unknown,

View File

@@ -116,7 +116,7 @@ class BertSentenceVectorizer(BaseFeaturizer):
X = convert_input(X)
tqdm.pandas()
columns = self.text_columns or [c for c in X.columns if X[c].dtype == np.object]
columns = self.text_columns or [c for c in X.columns if X[c].dtype == object]
non_text_columns = [c for c in X.columns if c not in columns]
column_names = []

View File

@@ -450,7 +450,7 @@ class StratifiedGroupKFold(_BaseKFold):
split_diffs[splitx] = cand_diffs[splitx]
grouped_splitx.append(splitx)
test_folds = np.empty(n_samples, dtype=np.int)
test_folds = np.empty(n_samples, dtype=int)
for group_idx, splitx in zip(sortx, grouped_splitx):
idxs = group_idxs[group_idx]
test_folds[idxs] = splitx