Skip to content
Draft
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
28 commits
Select commit Hold shift + click to select a range
6cb6852
[Autoloop: build-tsikit-learn-scikit-learn-typescript-migration] Iter…
github-actions[bot] May 13, 2026
471474f
ci: trigger checks
github-actions[bot] May 13, 2026
a516ede
[Autoloop: build-tsikit-learn-scikit-learn-typescript-migration] Iter…
github-actions[bot] May 14, 2026
566b081
ci: trigger checks
github-actions[bot] May 14, 2026
8650755
Merge main into autoloop/build-tsikit-learn-scikit-learn-typescript-m…
github-actions[bot] May 14, 2026
79db976
[Autoloop: build-tsikit-learn-scikit-learn-typescript-migration] Iter…
github-actions[bot] May 14, 2026
0155b38
[Autoloop: build-tsikit-learn-scikit-learn-typescript-migration] Iter…
github-actions[bot] May 14, 2026
89671ee
Fix CI: TypeScript errors and biome lint issues
github-actions[bot] May 14, 2026
28b5674
[Autoloop: build-tsikit-learn-scikit-learn-typescript-migration] Iter…
github-actions[bot] May 14, 2026
c21bb66
ci: trigger checks
github-actions[bot] May 14, 2026
bdb1cd2
[Autoloop: build-tsikit-learn-scikit-learn-typescript-migration] Iter…
github-actions[bot] May 15, 2026
f6c5c24
Fix pre-existing CI failures: biome lint and TypeScript type errors
github-actions[bot] May 15, 2026
632cb43
[Autoloop: build-tsikit-learn-scikit-learn-typescript-migration] Iter…
github-actions[bot] May 15, 2026
c9bb3ed
ci: trigger checks
github-actions[bot] May 15, 2026
f4360bc
[Autoloop: build-tsikit-learn-scikit-learn-typescript-migration] Iter…
github-actions[bot] May 15, 2026
dd2efa6
ci: trigger checks
github-actions[bot] May 15, 2026
33598f6
[Autoloop: build-tsikit-learn-scikit-learn-typescript-migration] Iter…
github-actions[bot] May 16, 2026
b57468e
ci: trigger checks
github-actions[bot] May 16, 2026
be9d699
[Autoloop: build-tsikit-learn-scikit-learn-typescript-migration] Iter…
github-actions[bot] May 16, 2026
92e15b1
ci: trigger checks
github-actions[bot] May 16, 2026
65a7644
[Autoloop: build-tsikit-learn-scikit-learn-typescript-migration] Iter…
github-actions[bot] May 16, 2026
c9f5753
ci: trigger checks
github-actions[bot] May 16, 2026
5db29ea
[Autoloop: build-tsikit-learn-scikit-learn-typescript-migration] Iter…
github-actions[bot] May 17, 2026
f8835b1
ci: trigger checks
github-actions[bot] May 17, 2026
4bc0d95
[Autoloop: build-tsikit-learn-scikit-learn-typescript-migration] Iter…
github-actions[bot] May 17, 2026
8220bee
ci: trigger checks
github-actions[bot] May 17, 2026
925e983
[Autoloop: build-tsikit-learn-scikit-learn-typescript-migration] Iter…
github-actions[bot] May 17, 2026
c6508d8
ci: trigger checks
github-actions[bot] May 17, 2026
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
6 changes: 5 additions & 1 deletion biome.json
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,11 @@
"linter": {
"enabled": true,
"rules": {
"recommended": true
"recommended": true,
"style": {
"noNonNullAssertion": "off",
"noInferrableTypes": "off"
}
}
},
"formatter": {
Expand Down
30 changes: 30 additions & 0 deletions playground/index.html
Original file line number Diff line number Diff line change
Expand Up @@ -116,6 +116,36 @@ <h3>ensemble</h3>
<p>RandomForest, GradientBoosting, AdaBoost</p>
<span class="status pending">🕐 Pending</span>
</div>
<div class="card">
<h3>feature_extraction.text</h3>
<p>CountVectorizer, TfidfVectorizer, HashingVectorizer</p>
<span class="status done">✅ Implemented</span>
</div>
<div class="card">
<h3>kernel_approximation</h3>
<p>RBFSampler, Nystroem, AdditiveChi2Sampler</p>
<span class="status done">✅ Implemented</span>
</div>
<div class="card">
<h3>covariance</h3>
<p>EmpiricalCovariance, ShrunkCovariance, LedoitWolf, OAS</p>
<span class="status done">✅ Implemented</span>
</div>
<div class="card">
<h3>cross_decomposition</h3>
<p>PLSRegression, PLSSVD</p>
<span class="status done">✅ Implemented</span>
</div>
<div class="card">
<h3>preprocessing (extended)</h3>
<p>PowerTransformer, QuantileTransformer, Binarizer, FunctionTransformer</p>
<span class="status done">✅ Implemented</span>
</div>
<div class="card">
<h3>decomposition (extended)</h3>
<p>IncrementalPCA, KernelPCA, FactorAnalysis</p>
<span class="status done">✅ Implemented</span>
</div>
</div>

<div class="demo-container">
Expand Down
141 changes: 141 additions & 0 deletions src/calibration/calibration.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,141 @@
/**
* Probability calibration.
* Mirrors sklearn.calibration.CalibratedClassifierCV.
* Uses Platt scaling (logistic) or isotonic regression for calibration.
*/

import { NotFittedError } from "../exceptions.js";

/**
 * Minimal contract a base estimator must satisfy to be calibrated.
 * The output of `predict` is treated as a raw score and fed into
 * Platt scaling, so any fit/predict estimator over Float64Array rows works.
 */
interface Classifier {
  fit(X: Float64Array[], y: Float64Array): this;
  predict(X: Float64Array[]): Float64Array;
  // Optional accuracy-style scorer; not called by the calibration wrapper.
  score?(X: Float64Array[], y: Float64Array): number;
}

/** Logistic function mapping a real-valued score into (0, 1). */
function sigmoid(x: number): number {
  return 1 / (1 + Math.exp(-x));
}

/**
 * Platt scaling: fit a logistic mapping p = sigmoid(A * score + B) from raw
 * classifier scores to positive-class probabilities.
 *
 * Parameters are found by plain batch gradient descent on the logistic loss
 * (fixed learning rate, fixed iteration budget), which is sufficient for
 * this two-parameter 1-D problem.
 *
 * @param scores raw scores produced by the base classifier
 * @param y binary targets (0/1), same length as `scores`
 * @returns the fitted [A, B] pair; [0, 0] (i.e. p = 0.5) for empty input
 */
function plattScale(scores: Float64Array, y: Float64Array): [number, number] {
  const n = scores.length;
  // Guard: with zero samples the update below would compute 0/0 and
  // poison A/B with NaN; return the neutral mapping instead.
  if (n === 0) return [0, 0];

  let A = 0;
  let B = 0;
  const lr = 0.01;

  for (let iter = 0; iter < 1000; iter++) {
    let gradA = 0;
    let gradB = 0;
    for (let i = 0; i < n; i++) {
      // Residual of the logistic model; its sums form the loss gradient.
      const p = sigmoid(A * (scores[i] ?? 0) + B);
      const err = p - (y[i] ?? 0);
      gradA += err * (scores[i] ?? 0);
      gradB += err;
    }
    A -= (lr * gradA) / n;
    B -= (lr * gradB) / n;
  }

  return [A, B];
}

/**
 * Probability calibration wrapper for binary problems, mirroring
 * sklearn.calibration.CalibratedClassifierCV.
 *
 * The data is split into `cv` contiguous folds; for each fold the base
 * estimator is trained on the remaining samples and a Platt (sigmoid)
 * mapping is fitted on the held-out fold's raw predictions. Probabilities
 * are the average of the per-fold calibrated outputs.
 *
 * NOTE(review): only Platt scaling is implemented; `method` is stored for
 * API compatibility but "isotonic" currently falls back to the sigmoid path.
 */
export class CalibratedClassifierCV {
  baseEstimator: Classifier;
  method: string;
  cv: number;

  // One entry per successful fold: the fold-trained estimator plus its
  // fitted Platt parameters (A, B).
  calibratedEstimators_: {
    estimator: Classifier;
    A: number;
    B: number;
  }[] | null = null;
  // Sorted unique class values observed during fit().
  classes_: Float64Array | null = null;

  constructor(
    baseEstimator: Classifier,
    options: { method?: string; cv?: number } = {},
  ) {
    this.baseEstimator = baseEstimator;
    this.method = options.method ?? "sigmoid";
    this.cv = options.cv ?? 5;
  }

  /** Shallow-clone the base estimator so each fold trains its own copy. */
  private cloneBase(): Classifier {
    const est = Object.create(
      Object.getPrototypeOf(this.baseEstimator) as object,
    ) as Classifier;
    Object.assign(est, this.baseEstimator);
    return est;
  }

  /**
   * Fit one calibrated estimator per hold-out fold.
   * The largest class value is treated as the positive class.
   */
  fit(X: Float64Array[], y: Float64Array): this {
    const n = X.length;
    const uniqueClasses = Array.from(new Set(Array.from(y))).sort(
      (a, b) => a - b,
    );
    this.classes_ = new Float64Array(uniqueClasses);
    const posClass = uniqueClasses[uniqueClasses.length - 1] ?? 1;

    // Binary 0/1 indicator of the positive class.
    const yBin = new Float64Array(y.map((yi) => (yi === posClass ? 1 : 0)));

    // Clamp the fold count so foldSize >= 1 even when cv > n; previously
    // cv > n made foldSize 0, yielding empty test folds whose Platt fit
    // produced NaN parameters. The configured `this.cv` stays untouched.
    const nFolds = Math.max(1, Math.min(this.cv, n));
    const foldSize = Math.floor(n / nFolds);
    this.calibratedEstimators_ = [];

    for (let fold = 0; fold < nFolds; fold++) {
      const testStart = fold * foldSize;
      const testEnd = fold === nFolds - 1 ? n : testStart + foldSize;

      const trainIdx: number[] = [];
      const testIdx: number[] = [];
      for (let i = 0; i < n; i++) {
        if (i >= testStart && i < testEnd) testIdx.push(i);
        else trainIdx.push(i);
      }

      // Degenerate split (e.g. n < 2): skip instead of fitting on nothing.
      if (trainIdx.length === 0 || testIdx.length === 0) continue;

      const XTrain = trainIdx.map((i) => X[i] ?? new Float64Array(0));
      const yTrain = new Float64Array(trainIdx.map((i) => y[i] ?? 0));
      const XTest = testIdx.map((i) => X[i] ?? new Float64Array(0));
      const yTest = new Float64Array(testIdx.map((i) => yBin[i] ?? 0));

      const est = this.cloneBase();
      est.fit(XTrain, yTrain);

      // Calibrate on the held-out fold's raw predictions.
      const testPred = est.predict(XTest);
      const [A, B] = plattScale(testPred, yTest);

      this.calibratedEstimators_.push({ estimator: est, A, B });
    }

    // Fallback for tiny datasets where no valid split existed:
    // fit on everything and calibrate in-sample.
    if (this.calibratedEstimators_.length === 0 && n > 0) {
      const est = this.cloneBase();
      est.fit(X, y);
      const [A, B] = plattScale(est.predict(X), yBin);
      this.calibratedEstimators_.push({ estimator: est, A, B });
    }

    return this;
  }

  /**
   * Averaged calibrated probabilities.
   * @returns one [P(negative), P(positive)] row per input sample
   * @throws NotFittedError if fit() has not been called
   */
  predictProba(X: Float64Array[]): Float64Array[] {
    if (this.calibratedEstimators_ === null)
      throw new NotFittedError("CalibratedClassifierCV");

    const n = X.length;
    const probs = new Float64Array(n);

    // Accumulate the sigmoid-calibrated score from every fold estimator.
    for (const { estimator, A, B } of this.calibratedEstimators_) {
      const scores = estimator.predict(X);
      for (let i = 0; i < n; i++) {
        probs[i] = (probs[i] ?? 0) + sigmoid(A * (scores[i] ?? 0) + B);
      }
    }

    const k = this.calibratedEstimators_.length;
    return Array.from({ length: n }, (_, i) => {
      const p = (probs[i] ?? 0) / k;
      return new Float64Array([1 - p, p]);
    });
  }

  /** Class labels: positive class when calibrated P(positive) >= 0.5. */
  predict(X: Float64Array[]): Float64Array {
    if (this.classes_ === null)
      throw new NotFittedError("CalibratedClassifierCV");
    const classes = this.classes_;
    const proba = this.predictProba(X);
    const posClass = classes[classes.length - 1] ?? 1;
    const negClass = classes[0] ?? 0;
    return new Float64Array(
      proba.map((p) => ((p[1] ?? 0) >= 0.5 ? posClass : negClass)),
    );
  }

  /** Mean accuracy of predict(X) against y. */
  score(X: Float64Array[], y: Float64Array): number {
    const pred = this.predict(X);
    let correct = 0;
    for (let i = 0; i < y.length; i++) {
      if (pred[i] === y[i]) correct++;
    }
    return correct / y.length;
  }
}
1 change: 1 addition & 0 deletions src/calibration/index.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
// Public entry point of the calibration module: re-exports everything
// calibration.ts exports (notably CalibratedClassifierCV).
export * from "./calibration.js";
199 changes: 199 additions & 0 deletions src/cluster/affinity_propagation.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,199 @@
/**
* AffinityPropagation clustering.
*/

import { NotFittedError } from "../exceptions.js";

/** Configuration options for {@link AffinityPropagation}. */
export interface AffinityPropagationOptions {
  // Damping applied to responsibility/availability updates (default 0.5);
  // each update blends the old value with the new one.
  dampingFactor?: number;
  // Maximum number of message-passing iterations (default 200).
  maxIter?: number;
  // Number of consecutive iterations with an unchanged exemplar set
  // required to declare convergence (default 15).
  convergenceIter?: number;
  // Self-similarity placed on the similarity-matrix diagonal; when omitted,
  // the median of the pairwise similarities is used.
  preference?: number;
}

/**
 * AffinityPropagation clustering.
 *
 * Message-passing clustering: samples exchange "responsibility" (R) and
 * "availability" (A) messages over a similarity matrix (negative squared
 * Euclidean distance) until a stable set of exemplars emerges. Each sample
 * is then labeled with the exemplar maximizing A + R.
 */
export class AffinityPropagation {
  private dampingFactor: number;
  private maxIter: number;
  private convergenceIter: number;
  private preference: number | undefined;

  // Cluster label per training sample (relabeled to 0..k-1), set by fit().
  labels_: Int32Array | null = null;
  // Indices (into the training data) of the chosen exemplars, ascending.
  clusterCentersIndices_: Int32Array | null = null;
  // Exemplar feature vectors aligned with the relabeled cluster ids;
  // retained so predict() can assign new samples to the nearest exemplar.
  clusterCenters_: Float64Array[] | null = null;
  nIter_ = 0;

  constructor(options: AffinityPropagationOptions = {}) {
    this.dampingFactor = options.dampingFactor ?? 0.5;
    this.maxIter = options.maxIter ?? 200;
    this.convergenceIter = options.convergenceIter ?? 15;
    this.preference = options.preference;
  }

  fit(X: Float64Array[]): this {
    const n = X.length;
    if (n === 0) {
      this.labels_ = new Int32Array(0);
      this.clusterCentersIndices_ = new Int32Array(0);
      this.clusterCenters_ = [];
      return this;
    }

    // Build similarity matrix S = -||xi - xj||^2 (symmetric).
    const S: Float64Array[] = Array.from(
      { length: n },
      () => new Float64Array(n),
    );
    for (let i = 0; i < n; i++) {
      const xi = X[i] ?? new Float64Array(0);
      for (let j = i; j < n; j++) {
        const xj = X[j] ?? new Float64Array(0);
        let d = 0;
        for (let k = 0; k < xi.length; k++)
          d += ((xi[k] ?? 0) - (xj[k] ?? 0)) ** 2;
        (S[i] as Float64Array)[j] = -d;
        (S[j] as Float64Array)[i] = -d;
      }
    }

    // Set preference (diagonal); default is the median pairwise similarity.
    let pref = this.preference;
    if (pref === undefined) {
      const vals: number[] = [];
      for (let i = 0; i < n; i++)
        for (let j = i + 1; j < n; j++)
          vals.push((S[i] as Float64Array)[j] ?? 0);
      vals.sort((a, b) => a - b);
      pref = vals[Math.floor(vals.length / 2)] ?? -1;
    }
    for (let i = 0; i < n; i++) (S[i] as Float64Array)[i] = pref;

    // Responsibility R and Availability A matrices, updated with damping d.
    const R: Float64Array[] = Array.from(
      { length: n },
      () => new Float64Array(n),
    );
    const A: Float64Array[] = Array.from(
      { length: n },
      () => new Float64Array(n),
    );
    const d = this.dampingFactor;
    let stableCount = 0;
    let prevExemplars: Set<number> = new Set();

    for (let iter = 0; iter < this.maxIter; iter++) {
      // Update responsibilities: R(i,k) = S(i,k) - max_{k'!=k}[A(i,k')+S(i,k')]
      for (let i = 0; i < n; i++) {
        const Si = S[i] ?? new Float64Array(n);
        const Ai = A[i] ?? new Float64Array(n);
        // Track the two largest A+S values so the "max over k' != k" is O(n).
        let max1 = Number.NEGATIVE_INFINITY;
        let max2 = Number.NEGATIVE_INFINITY;
        let argmax1 = -1;
        for (let k = 0; k < n; k++) {
          const v = (Ai[k] ?? 0) + (Si[k] ?? 0);
          if (v > max1) {
            max2 = max1;
            max1 = v;
            argmax1 = k;
          } else if (v > max2) max2 = v;
        }
        const Ri = R[i] ?? new Float64Array(n);
        for (let k = 0; k < n; k++) {
          const maxOther = k === argmax1 ? max2 : max1;
          const newR = (Si[k] ?? 0) - maxOther;
          Ri[k] = d * (Ri[k] ?? 0) + (1 - d) * newR;
        }
      }

      // Update availabilities:
      // A(i,k) = min(0, R(k,k) + sum of positive R(i',k) for i' not in {i,k})
      // A(k,k) = sum of positive R(i',k) for i' != k
      for (let k = 0; k < n; k++) {
        let sumPos = 0;
        for (let i = 0; i < n; i++) {
          if (i === k) continue;
          const v = (R[i] as Float64Array)[k] ?? 0;
          if (v > 0) sumPos += v;
        }
        const rkk = (R[k] as Float64Array)[k] ?? 0;
        for (let i = 0; i < n; i++) {
          const Ai = A[i] ?? new Float64Array(n);
          let newA: number;
          if (i === k) {
            newA = sumPos;
          } else {
            // Subtract this sample's own positive contribution.
            const rik = (R[i] as Float64Array)[k] ?? 0;
            const sumWithout = sumPos - (rik > 0 ? rik : 0);
            newA = Math.min(0, rkk + sumWithout);
          }
          Ai[k] = d * (Ai[k] ?? 0) + (1 - d) * newA;
        }
      }

      // Convergence check: exemplar of each sample is argmax_k [A(i,k)+R(i,k)].
      const exemplars = new Set<number>();
      for (let i = 0; i < n; i++) {
        const Ai = A[i] ?? new Float64Array(n);
        const Ri = R[i] ?? new Float64Array(n);
        let best = Number.NEGATIVE_INFINITY;
        let bestK = 0;
        for (let k = 0; k < n; k++) {
          const v = (Ai[k] ?? 0) + (Ri[k] ?? 0);
          if (v > best) {
            best = v;
            bestK = k;
          }
        }
        exemplars.add(bestK);
      }

      const same =
        exemplars.size === prevExemplars.size &&
        [...exemplars].every((e) => prevExemplars.has(e));
      if (same) {
        stableCount++;
        if (stableCount >= this.convergenceIter) {
          this.nIter_ = iter + 1;
          break;
        }
      } else {
        stableCount = 0;
      }
      prevExemplars = exemplars;
      this.nIter_ = iter + 1;
    }

    // Assign final labels from the converged messages.
    const labels = new Int32Array(n);
    for (let i = 0; i < n; i++) {
      const Ai = A[i] ?? new Float64Array(n);
      const Ri = R[i] ?? new Float64Array(n);
      let best = Number.NEGATIVE_INFINITY;
      let bestK = 0;
      for (let k = 0; k < n; k++) {
        const v = (Ai[k] ?? 0) + (Ri[k] ?? 0);
        if (v > best) {
          best = v;
          bestK = k;
        }
      }
      labels[i] = bestK;
    }

    const centerSet = new Set<number>(Array.from(labels));
    const centers = Int32Array.from([...centerSet].sort((a, b) => a - b));
    // Relabel exemplar indices to compact cluster ids 0..k-1.
    const map = new Map<number, number>();
    centers.forEach((c, idx) => map.set(c, idx));
    for (let i = 0; i < n; i++) labels[i] = map.get(labels[i] ?? 0) ?? 0;

    this.labels_ = labels;
    this.clusterCentersIndices_ = centers;
    // Keep the exemplar vectors (in relabeled order) for predict().
    this.clusterCenters_ = Array.from(
      centers,
      (c) => X[c] ?? new Float64Array(0),
    );
    return this;
  }

  /**
   * Assign each sample to the nearest exemplar found during fit()
   * (squared Euclidean distance). Previously this was an unimplemented
   * stub that always returned -1 labels; -1 now appears only in the
   * degenerate case where fit() produced no exemplars.
   * @throws NotFittedError if fit() has not been called
   */
  predict(X: Float64Array[]): Int32Array {
    if (!this.labels_ || !this.clusterCentersIndices_ || !this.clusterCenters_)
      throw new NotFittedError("AffinityPropagation");
    const centers = this.clusterCenters_;
    const out = new Int32Array(X.length).fill(-1);
    if (centers.length === 0) return out;
    for (let i = 0; i < X.length; i++) {
      const xi = X[i] ?? new Float64Array(0);
      let best = Number.POSITIVE_INFINITY;
      let bestIdx = -1;
      for (let c = 0; c < centers.length; c++) {
        const center = centers[c] ?? new Float64Array(0);
        let dist = 0;
        for (let k = 0; k < xi.length; k++)
          dist += ((xi[k] ?? 0) - (center[k] ?? 0)) ** 2;
        if (dist < best) {
          best = dist;
          bestIdx = c;
        }
      }
      out[i] = bestIdx;
    }
    return out;
  }
}
Loading
Loading