We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent d565ed4, commit f01c3c1 (Copy full SHA for f01c3c1)
1 file changed
WDoc/utils/tasks/query.py
@@ -209,6 +209,7 @@ def semantic_batching(
209
vr = np.cumsum(pca.explained_variance_ratio_)[-1]
210
if vr <= 0.90:
211
red(f"Found lower than exepcted PCA explained variance ratio: {vr:.4f}")
212
+ assert vr >= 0.75, f"Found substancially low explained variance ratio afer pca at {vr:.4f} so not using dimension reduction"
213
embeddings = pd.DataFrame(
214
columns=[f"v_{i}" for i in range(embeds_reduced.shape[1])],
215
index=[i for i in range(len(texts))],
0 commit comments