Update README.md
README.md
CHANGED
@@ -44,4 +44,71 @@ const model = await AutoModel.from_pretrained(MODEL_ID, {
// the types are wildly incorrect... but this should get you what you need!
```

#### Rough Outline of Getting Attentions

> This may not be the best way, but the documentation is truly lacking and this does the job :-P

```typescript
/**
 * Collect attentions across layers from a model.forward(...) output.
 *
 * ⚠️ Transformers.js variation:
 * - Some builds return `{ attentions: Tensor[] }`.
 * - Others return a dict with `attention_1`, `attention_2`, ... per layer.
 *
 * @internal
 * @param out Raw dictionary from `model.forward(...)`.
 * @returns Array of attention tensors (one per layer) with dims `[1, H, T, T]`.
 */
function collectAttentions(out: Record<string, Tensor>): XtTensor[] {
  // Prefer array form if present (runtime feature; TS types don’t guarantee it).
  const anyOut = out as unknown as { attentions?: XtTensor[] };
  if (Array.isArray(anyOut.attentions)) return anyOut.attentions;

  // Otherwise gather attention_1..attention_N and sort numerically by suffix.
  const keys = Object.keys(out)
    .filter((k) => /^attention_\d+$/i.test(k))
    .sort(
      (a, b) => parseInt(a.split('_')[1], 10) - parseInt(b.split('_')[1], 10),
    );

  return keys.map((k) => out[k] as unknown as XtTensor);
}

/**
 * Tokenization:
 * Prefer the public callable form `tokenizer(text, {...})`, which returns tensors.
 * If your wrapper only exposes `_call` (private-ish), we fall back to it here.
 * The result includes `input_ids` and `attention_mask` tensors.
 */
const enc =
  typeof tokenizer === 'function'
    ? // eslint-disable-next-line @typescript-eslint/await-thenable
      await (tokenizer as unknown as typeof tokenizer._call)(text, {
        add_special_tokens: true,
      })
    : tokenizer._call(text, { add_special_tokens: true }); // <-- documented hack

// Convert tensor buffers (may be BigInt) → number[] for downstream processing.
const input_ids = Array.from(
  (enc.input_ids as Tensor).data as ArrayLike<number | bigint>,
).map(Number);

/**
 * Forward pass with attentions.
 *
 * Another "crazy" bit: different Transformers.js builds expose attentions differently. We:
 * - accept `{ attentions: Tensor[] }`, or
 * - collect `attention_1, attention_2, ...` and sort them.
 * Also, `Tensor` has no `.get(...)`, so we do **flat buffer indexing** with `dims`.
 */
const out = (await model.forward({
  input_ids: enc.input_ids, // pass the tokenizer's tensor here; the number[] above is for downstream token work
  attention_mask: windowAttentionMask, // attention-mask tensor for your window (e.g. enc.attention_mask)
  output_attentions: true,
})) as unknown as Record<string, Tensor>;

const attentions = collectAttentions(out);
```
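Once you have `attentions`, remember there is no `.get(...)` on the tensors: you read an individual weight by computing a flat offset into `data` from `dims`. A minimal sketch of that indexing, assuming the `[1, H, T, T]` layout noted above and that your tensor type exposes `dims`/`data` like the Transformers.js `Tensor` (`attentionAt`, `head`, `q`, and `k` are just illustrative names):

```typescript
// Read the attention weight at [0, head, q, k] from one layer's tensor
// by flattening the 4-D index into the 1-D data buffer (row-major, batch = 0).
function attentionAt(attn: XtTensor, head: number, q: number, k: number): number {
  const T = (attn.dims as number[])[2]; // dims are [1, H, T, T]
  const flat = (head * T + q) * T + k;
  return Number((attn.data as ArrayLike<number | bigint>)[flat]);
}

// e.g. how much query token 0 attends to key token 5 in head 2 of the last layer:
const w = attentionAt(attentions[attentions.length - 1], 2, 0, 5);
```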