Spaces:
Running
Running
added helpers
Browse files- wm_interactive/static/styles.css +94 -0
- wm_interactive/templates/index.html +125 -15
wm_interactive/static/styles.css
CHANGED
@@ -354,4 +354,98 @@ h1 {
|
|
354 |
|
355 |
.floating-btn.generating .stop-icon {
|
356 |
display: block;
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
357 |
}
|
|
|
354 |
|
355 |
.floating-btn.generating .stop-icon {
|
356 |
display: block;
|
357 |
+
}
|
358 |
+
|
359 |
+
/* Help documentation styles */
|
360 |
+
.param-help-icon {
|
361 |
+
color: #6e6e80;
|
362 |
+
font-size: 14px;
|
363 |
+
cursor: pointer;
|
364 |
+
}
|
365 |
+
|
366 |
+
.help-modal-body {
|
367 |
+
max-height: 70vh;
|
368 |
+
overflow-y: auto;
|
369 |
+
}
|
370 |
+
|
371 |
+
.help-modal-body h4 {
|
372 |
+
margin-top: 1.5rem;
|
373 |
+
margin-bottom: 0.75rem;
|
374 |
+
font-size: 1.1rem;
|
375 |
+
font-weight: 600;
|
376 |
+
color: #10a37f;
|
377 |
+
}
|
378 |
+
|
379 |
+
.help-modal-body h4:first-child {
|
380 |
+
margin-top: 0;
|
381 |
+
}
|
382 |
+
|
383 |
+
.help-modal-body p {
|
384 |
+
margin-bottom: 1rem;
|
385 |
+
line-height: 1.6;
|
386 |
+
}
|
387 |
+
|
388 |
+
.help-modal-body ol, .help-modal-body ul {
|
389 |
+
margin-bottom: 1rem;
|
390 |
+
padding-left: 1.5rem;
|
391 |
+
}
|
392 |
+
|
393 |
+
.help-modal-body li {
|
394 |
+
margin-bottom: 0.5rem;
|
395 |
+
}
|
396 |
+
|
397 |
+
.help-description-list dt {
|
398 |
+
font-weight: 600;
|
399 |
+
margin-bottom: 0.25rem;
|
400 |
+
}
|
401 |
+
|
402 |
+
.help-description-list dd {
|
403 |
+
margin-bottom: 1rem;
|
404 |
+
margin-left: 1rem;
|
405 |
+
}
|
406 |
+
|
407 |
+
.paper-references {
|
408 |
+
list-style: none;
|
409 |
+
padding-left: 0;
|
410 |
+
}
|
411 |
+
|
412 |
+
.paper-references li {
|
413 |
+
margin-bottom: 0.75rem;
|
414 |
+
padding-left: 1rem;
|
415 |
+
border-left: 3px solid #e5e5e5;
|
416 |
+
}
|
417 |
+
|
418 |
+
.paper-references a {
|
419 |
+
display: block;
|
420 |
+
color: #10a37f;
|
421 |
+
font-weight: 500;
|
422 |
+
margin-bottom: 0.25rem;
|
423 |
+
}
|
424 |
+
|
425 |
+
.paper-authors {
|
426 |
+
display: block;
|
427 |
+
color: #6e6e80;
|
428 |
+
font-size: 0.9rem;
|
429 |
+
font-style: italic;
|
430 |
+
}
|
431 |
+
|
432 |
+
/* Tooltip adjustments for parameter help icons */
|
433 |
+
.tooltip {
|
434 |
+
--bs-tooltip-max-width: 300px;
|
435 |
+
--bs-tooltip-opacity: 1;
|
436 |
+
--bs-tooltip-padding-y: 0.5rem;
|
437 |
+
--bs-tooltip-padding-x: 0.75rem;
|
438 |
+
--bs-tooltip-bg: rgba(26, 26, 26, 0.95);
|
439 |
+
font-size: 13px;
|
440 |
+
line-height: 1.4;
|
441 |
+
}
|
442 |
+
|
443 |
+
@media (max-width: 768px) {
|
444 |
+
.help-modal-body {
|
445 |
+
max-height: 60vh;
|
446 |
+
}
|
447 |
+
|
448 |
+
.tooltip {
|
449 |
+
--bs-tooltip-max-width: 200px;
|
450 |
+
}
|
451 |
}
|
wm_interactive/templates/index.html
CHANGED
@@ -11,9 +11,97 @@
|
|
11 |
<div class="container">
|
12 |
<div class="d-flex justify-content-between align-items-center">
|
13 |
<h1>Interactive watermark detector</h1>
|
14 |
-
<
|
15 |
-
<
|
16 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
17 |
</div>
|
18 |
|
19 |
<!-- Advanced Parameters Modal -->
|
@@ -26,7 +114,10 @@
|
|
26 |
</div>
|
27 |
<div class="modal-body">
|
28 |
<div class="mb-3">
|
29 |
-
<
|
|
|
|
|
|
|
30 |
<select class="form-select" id="detectorType">
|
31 |
<option value="maryland">Maryland</option>
|
32 |
<option value="marylandz">Maryland Z-score</option>
|
@@ -36,22 +127,34 @@
|
|
36 |
<div class="form-text">Type of watermark detection algorithm</div>
|
37 |
</div>
|
38 |
<div class="mb-3">
|
39 |
-
<
|
|
|
|
|
|
|
40 |
<input type="number" class="form-control" id="seed" value="0">
|
41 |
<div class="form-text">Random seed for the watermark detector</div>
|
42 |
</div>
|
43 |
<div class="mb-3">
|
44 |
-
<
|
|
|
|
|
|
|
45 |
<input type="number" class="form-control" id="ngram" value="1">
|
46 |
<div class="form-text">Size of the n-gram window used for detection</div>
|
47 |
</div>
|
48 |
<div class="mb-3">
|
49 |
-
<
|
|
|
|
|
|
|
50 |
<input type="number" step="0.1" class="form-control" id="delta" value="2.0">
|
51 |
<div class="form-text">Bias added to greenlist tokens (for Maryland method)</div>
|
52 |
</div>
|
53 |
<div class="mb-3">
|
54 |
-
<
|
|
|
|
|
|
|
55 |
<input type="number" step="0.1" class="form-control" id="temperature" value="0.8">
|
56 |
<div class="form-text">Temperature for sampling (higher = more random)</div>
|
57 |
</div>
|
@@ -137,6 +240,20 @@
|
|
137 |
const deltaInput = document.getElementById('delta');
|
138 |
const temperatureInput = document.getElementById('temperature');
|
139 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
140 |
function startGeneration() {
|
141 |
const prompt = promptArea.value.trim();
|
142 |
if (!prompt) {
|
@@ -439,13 +556,6 @@
|
|
439 |
});
|
440 |
});
|
441 |
|
442 |
-
// Initial tokenization with error handling
|
443 |
-
document.addEventListener('DOMContentLoaded', function() {
|
444 |
-
updateTokenization().catch(error => {
|
445 |
-
console.error('Error during initial tokenization:', error);
|
446 |
-
});
|
447 |
-
});
|
448 |
-
|
449 |
// Add this helper function for formatting p-values
|
450 |
function formatPValue(value) {
|
451 |
if (value >= 0.001) {
|
|
|
11 |
<div class="container">
|
12 |
<div class="d-flex justify-content-between align-items-center">
|
13 |
<h1>Interactive watermark detector</h1>
|
14 |
+
<div class="d-flex gap-2">
|
15 |
+
<button class="btn btn-outline-secondary" data-bs-toggle="modal" data-bs-target="#helpModal">
|
16 |
+
<i class="bi bi-question-circle"></i>
|
17 |
+
</button>
|
18 |
+
<button class="btn btn-outline-secondary" data-bs-toggle="modal" data-bs-target="#paramsModal">
|
19 |
+
<i class="bi bi-gear"></i>
|
20 |
+
</button>
|
21 |
+
</div>
|
22 |
+
</div>
|
23 |
+
|
24 |
+
<!-- Help Modal -->
|
25 |
+
<div class="modal fade" id="helpModal" tabindex="-1">
|
26 |
+
<div class="modal-dialog modal-lg">
|
27 |
+
<div class="modal-content">
|
28 |
+
<div class="modal-header">
|
29 |
+
<h5 class="modal-title">Watermark Detection Help</h5>
|
30 |
+
<button type="button" class="btn-close" data-bs-dismiss="modal"></button>
|
31 |
+
</div>
|
32 |
+
<div class="modal-body help-modal-body">
|
33 |
+
<h4>What is LLM watermarking?</h4>
|
34 |
+
<p>LLM watermarking is a technique that slightly modifies how language models generate text, making it possible to detect if text was generated by a specific AI model without visibly changing the text quality.</p>
|
35 |
+
|
36 |
+
<h4>How to use this demo</h4>
|
37 |
+
<ol>
|
38 |
+
<li>Enter a prompt in the top text area to generate watermarked text</li>
|
39 |
+
<li>The generated text will appear in the second text box</li>
|
40 |
+
<li>The text will be automatically analyzed to show which tokens (parts of text) were influenced by the watermark</li>
|
41 |
+
<li>The statistics at the bottom show the detection results</li>
|
42 |
+
<li>You can also paste any text in the second box to test if it contains a watermark</li>
|
43 |
+
</ol>
|
44 |
+
|
45 |
+
<h4>Detection Methods</h4>
|
46 |
+
<p><strong>Maryland</strong>: A token-level detection algorithm that analyzes how unexpected each token is, based on the paper "<a href="https://arxiv.org/abs/2301.10226" target="_blank">A Watermark for Large Language Models</a>" by Kirchenbauer et al.</p>
|
47 |
+
<p><strong>Maryland Z-score</strong>: A variant of the Maryland detector that uses z-scores for better statistical interpretation.</p>
|
48 |
+
<p><strong>OpenAI</strong>: A watermarking method similar to what was described in "<a href="https://arxiv.org/abs/2306.04634" target="_blank">On the Reliability of Watermarks for Large Language Models</a>" by Kirchenbauer et al., inspired by initial reports from OpenAI.</p>
|
49 |
+
<p><strong>OpenAI Z-score</strong>: A variant of the OpenAI detector that uses z-scores for better statistical interpretation.</p>
|
50 |
+
|
51 |
+
<h4>Parameters Explained</h4>
|
52 |
+
<dl class="help-description-list">
|
53 |
+
<dt>Detector Type</dt>
|
54 |
+
<dd>The algorithm used to detect watermarks in the text. Different detectors perform better in different scenarios.</dd>
|
55 |
+
|
56 |
+
<dt>Seed</dt>
|
57 |
+
<dd>The random seed used for watermarking. The detector must use the same seed that was used when generating the text. In a real-world scenario, this would be kept private by the model provider.</dd>
|
58 |
+
|
59 |
+
<dt>N-gram Size</dt>
|
60 |
+
<dd>The number of previous tokens considered when choosing "greenlist" tokens. Larger values make the watermark harder to reverse-engineer but less robust against edits to the text.</dd>
|
61 |
+
|
62 |
+
<dt>Delta</dt>
|
63 |
+
<dd>The bias added to "greenlist" tokens during generation. Higher values make the watermark stronger but might affect text quality. Typical values range from 1.0 to 5.0.</dd>
|
64 |
+
|
65 |
+
<dt>Temperature</dt>
|
66 |
+
<dd>Controls randomness in text generation. Higher values (e.g., 1.0) produce more diverse outputs; lower values (e.g., 0.2) make outputs more focused and deterministic.</dd>
|
67 |
+
</dl>
|
68 |
+
|
69 |
+
<h4>Understanding Results</h4>
|
70 |
+
<dl class="help-description-list">
|
71 |
+
<dt>Tokens</dt>
|
72 |
+
<dd>The total number of tokens in the analyzed text. Tokens are units of text that may represent words, parts of words, or punctuation.</dd>
|
73 |
+
|
74 |
+
<dt>Scored Tokens</dt>
|
75 |
+
<dd>The number of tokens that were actually evaluated by the detector (excludes first few tokens that don't have enough context).</dd>
|
76 |
+
|
77 |
+
<dt>Final Score</dt>
|
78 |
+
<dd>A measure of how likely the text contains a watermark. Higher scores indicate stronger evidence of watermarking.</dd>
|
79 |
+
|
80 |
+
<dt>P-value</dt>
|
81 |
+
<dd>The statistical significance of the detection. Lower values (especially p &lt; 0.05) indicate strong evidence that the text was watermarked. Values close to 0.5 suggest no watermark is present.</dd>
|
82 |
+
</dl>
|
83 |
+
|
84 |
+
<h4>Related Papers</h4>
|
85 |
+
<ul class="paper-references">
|
86 |
+
<li>
|
87 |
+
<a href="https://arxiv.org/abs/2301.10226" target="_blank">A Watermark for Large Language Models</a>
|
88 |
+
<span class="paper-authors">Kirchenbauer, Geiping, et al. (2023)</span>
|
89 |
+
</li>
|
90 |
+
<li>
|
91 |
+
<a href="https://arxiv.org/abs/2307.15593" target="_blank">Robust Distortion-free Watermarks for Language Models</a>
|
92 |
+
<span class="paper-authors">Kuditipudi, Thickstun, et al. (2023)</span>
|
93 |
+
</li>
|
94 |
+
<li>
|
95 |
+
<a href="https://arxiv.org/abs/2306.17439" target="_blank">Provable Robust Watermarking for AI-Generated Text</a>
|
96 |
+
<span class="paper-authors">Zhao, Ananth, et al. (2023)</span>
|
97 |
+
</li>
|
98 |
+
</ul>
|
99 |
+
</div>
|
100 |
+
<div class="modal-footer">
|
101 |
+
<button type="button" class="btn btn-primary" data-bs-dismiss="modal">Close</button>
|
102 |
+
</div>
|
103 |
+
</div>
|
104 |
+
</div>
|
105 |
</div>
|
106 |
|
107 |
<!-- Advanced Parameters Modal -->
|
|
|
114 |
</div>
|
115 |
<div class="modal-body">
|
116 |
<div class="mb-3">
|
117 |
+
<div class="d-flex align-items-center">
|
118 |
+
<i class="bi bi-info-circle param-help-icon me-2" data-bs-toggle="tooltip" title="The algorithm used to detect watermarks in the text. Different algorithms have different strengths and weaknesses."></i>
|
119 |
+
<label for="detectorType" class="form-label mb-0">Detector Type</label>
|
120 |
+
</div>
|
121 |
<select class="form-select" id="detectorType">
|
122 |
<option value="maryland">Maryland</option>
|
123 |
<option value="marylandz">Maryland Z-score</option>
|
|
|
127 |
<div class="form-text">Type of watermark detection algorithm</div>
|
128 |
</div>
|
129 |
<div class="mb-3">
|
130 |
+
<div class="d-flex align-items-center">
|
131 |
+
<i class="bi bi-info-circle param-help-icon me-2" data-bs-toggle="tooltip" title="The random seed used for watermarking. For detection to work, this must match the seed used during generation."></i>
|
132 |
+
<label for="seed" class="form-label mb-0">Seed</label>
|
133 |
+
</div>
|
134 |
<input type="number" class="form-control" id="seed" value="0">
|
135 |
<div class="form-text">Random seed for the watermark detector</div>
|
136 |
</div>
|
137 |
<div class="mb-3">
|
138 |
+
<div class="d-flex align-items-center">
|
139 |
+
<i class="bi bi-info-circle param-help-icon me-2" data-bs-toggle="tooltip" title="The number of previous tokens considered when determining the token distribution. Higher values are more secure but may affect quality."></i>
|
140 |
+
<label for="ngram" class="form-label mb-0">N-gram Size</label>
|
141 |
+
</div>
|
142 |
<input type="number" class="form-control" id="ngram" value="1">
|
143 |
<div class="form-text">Size of the n-gram window used for detection</div>
|
144 |
</div>
|
145 |
<div class="mb-3">
|
146 |
+
<div class="d-flex align-items-center">
|
147 |
+
<i class="bi bi-info-circle param-help-icon me-2" data-bs-toggle="tooltip" title="The bias added to greenlist tokens during generation. Higher values (2.0-5.0) make watermarks easier to detect but might affect text quality."></i>
|
148 |
+
<label for="delta" class="form-label mb-0">Delta</label>
|
149 |
+
</div>
|
150 |
<input type="number" step="0.1" class="form-control" id="delta" value="2.0">
|
151 |
<div class="form-text">Bias added to greenlist tokens (for Maryland method)</div>
|
152 |
</div>
|
153 |
<div class="mb-3">
|
154 |
+
<div class="d-flex align-items-center">
|
155 |
+
<i class="bi bi-info-circle param-help-icon me-2" data-bs-toggle="tooltip" title="Controls randomness in generation. Higher values (closer to 1.0) create more diverse outputs but might make watermarks harder to detect."></i>
|
156 |
+
<label for="temperature" class="form-label mb-0">Temperature</label>
|
157 |
+
</div>
|
158 |
<input type="number" step="0.1" class="form-control" id="temperature" value="0.8">
|
159 |
<div class="form-text">Temperature for sampling (higher = more random)</div>
|
160 |
</div>
|
|
|
240 |
const deltaInput = document.getElementById('delta');
|
241 |
const temperatureInput = document.getElementById('temperature');
|
242 |
|
243 |
+
// Initialize tooltips
|
244 |
+
document.addEventListener('DOMContentLoaded', function() {
|
245 |
+
// Initialize Bootstrap tooltips
|
246 |
+
const tooltipTriggerList = [].slice.call(document.querySelectorAll('[data-bs-toggle="tooltip"]'));
|
247 |
+
const tooltipList = tooltipTriggerList.map(function (tooltipTriggerEl) {
|
248 |
+
return new bootstrap.Tooltip(tooltipTriggerEl);
|
249 |
+
});
|
250 |
+
|
251 |
+
// Initialize our tokenization
|
252 |
+
updateTokenization().catch(error => {
|
253 |
+
console.error('Error during initial tokenization:', error);
|
254 |
+
});
|
255 |
+
});
|
256 |
+
|
257 |
function startGeneration() {
|
258 |
const prompt = promptArea.value.trim();
|
259 |
if (!prompt) {
|
|
|
556 |
});
|
557 |
});
|
558 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
559 |
// Add this helper function for formatting p-values
|
560 |
function formatPValue(value) {
|
561 |
if (value >= 0.001) {
|