Spaces:

av-codes
/

prompt-injection-detector

Running

av committed about 18 hours ago

Commit

9d929f5

1 Parent(s): ed5b990

fix: use actual text length for HRM input instead of padding to 2048

Files changed (1) hide show

index.html CHANGED Viewed

@@ -521,16 +521,15 @@
     const bytes = encoder.encode(text);
     const len = Math.min(bytes.length, HRM_MAX_LEN);
-    const inputIds = new BigInt64Array(HRM_MAX_LEN);
-    const attentionMask = new BigInt64Array(HRM_MAX_LEN);
     for (let i = 0; i < len; i++) {
       inputIds[i] = BigInt(bytes[i]);
       attentionMask[i] = 1n;
     }
-    // Remaining positions are already 0 (padded)
-    return { inputIds, attentionMask };
   }
   async function analyzeDistilbert(text) {
@@ -540,11 +539,11 @@
   }
   async function analyzeHrm(text) {
-    const { inputIds, attentionMask } = tokenizeBytes(text);
     const ortLib = await getOrt();
-    const inputTensor = new ortLib.Tensor('int64', inputIds, [1, HRM_MAX_LEN]);
-    const maskTensor = new ortLib.Tensor('int64', attentionMask, [1, HRM_MAX_LEN]);
     const results = await hrmSession.run({
       input_ids: inputTensor,

     const bytes = encoder.encode(text);
     const len = Math.min(bytes.length, HRM_MAX_LEN);
+    const inputIds = new BigInt64Array(len);
+    const attentionMask = new BigInt64Array(len);
     for (let i = 0; i < len; i++) {
       inputIds[i] = BigInt(bytes[i]);
       attentionMask[i] = 1n;
     }
+    return { inputIds, attentionMask, seqLen: len };
   }
   async function analyzeDistilbert(text) {
   }
   async function analyzeHrm(text) {
+    const { inputIds, attentionMask, seqLen } = tokenizeBytes(text);
     const ortLib = await getOrt();
+    const inputTensor = new ortLib.Tensor('int64', inputIds, [1, seqLen]);
+    const maskTensor = new ortLib.Tensor('int64', attentionMask, [1, seqLen]);
     const results = await hrmSession.run({
       input_ids: inputTensor,