Spaces:
Running
Running
Use trajectories_with_cognitive_map_probe_examples dataset
Browse files
Load trajectories with probe predictions from project-telos/trajectories_with_cognitive_map_probe_examples,
with pre/post-reasoning, size (7/11/15), complexity, and index selectors.
Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
- README.md +1 -1
- index.html +10 -4
README.md
CHANGED
|
@@ -10,7 +10,7 @@ license: apache-2.0
|
|
| 10 |
|
| 11 |
Interactive trace viewer for visualizing language model agent trajectories in 2D grid environments, with probing results overlaid on tokens.
|
| 12 |
|
| 13 |
-
Trajectories can be loaded directly from the [project-telos/
|
| 14 |
|
| 15 |
Part of the paper: [A Behavioural and Representational Evaluation of Goal-Directedness in Language Model Agents](https://arxiv.org/abs/2602.08964).
|
| 16 |
|
|
|
|
| 10 |
|
| 11 |
Interactive trace viewer for visualizing language model agent trajectories in 2D grid environments, with probing results overlaid on tokens.
|
| 12 |
|
| 13 |
+
Trajectories with probe predictions can be loaded directly from the [project-telos/trajectories_with_cognitive_map_probe_examples](https://huggingface.co/datasets/project-telos/trajectories_with_cognitive_map_probe_examples) dataset, or uploaded as JSON files.
|
| 14 |
|
| 15 |
Part of the paper: [A Behavioural and Representational Evaluation of Goal-Directedness in Language Model Agents](https://arxiv.org/abs/2602.08964).
|
| 16 |
|
index.html
CHANGED
|
@@ -750,12 +750,15 @@
|
|
| 750 |
<div class="controls">
|
| 751 |
<div class="hf-loader">
|
| 752 |
<span class="hf-icon">🤗</span>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 753 |
<label>Size:</label>
|
| 754 |
<select id="hfSize">
|
| 755 |
<option value="7">7</option>
|
| 756 |
-
<option value="9">9</option>
|
| 757 |
<option value="11">11</option>
|
| 758 |
-
<option value="13">13</option>
|
| 759 |
<option value="15">15</option>
|
| 760 |
</select>
|
| 761 |
<label>Complexity:</label>
|
|
@@ -881,6 +884,7 @@
|
|
| 881 |
const helpHeader = document.getElementById('helpHeader');
|
| 882 |
const helpContent = document.getElementById('helpContent');
|
| 883 |
const layerSelector = document.getElementById('layerSelector');
|
|
|
|
| 884 |
const hfSize = document.getElementById('hfSize');
|
| 885 |
const hfComplexity = document.getElementById('hfComplexity');
|
| 886 |
const hfIndex = document.getElementById('hfIndex');
|
|
@@ -1019,11 +1023,12 @@
|
|
| 1019 |
});
|
| 1020 |
|
| 1021 |
hfLoadBtn.addEventListener('click', async () => {
|
|
|
|
| 1022 |
const size = hfSize.value;
|
| 1023 |
const comp = hfComplexity.value;
|
| 1024 |
const idx = hfIndex.value;
|
| 1025 |
const fileName = `together_ai_openai_gpt-oss-20b_size${size}_comp${comp}_${idx}.json`;
|
| 1026 |
-
const url = `https://huggingface.co/datasets/project-telos/
|
| 1027 |
|
| 1028 |
hfLoadBtn.disabled = true;
|
| 1029 |
hfLoadBtn.textContent = 'Loading...';
|
|
@@ -1033,7 +1038,8 @@
|
|
| 1033 |
throw new Error(`Failed to fetch trajectory (${response.status})`);
|
| 1034 |
}
|
| 1035 |
const data = await response.json();
|
| 1036 |
-
|
|
|
|
| 1037 |
} catch (error) {
|
| 1038 |
alert('Error loading from HuggingFace: ' + error.message);
|
| 1039 |
console.error(error);
|
|
|
|
| 750 |
<div class="controls">
|
| 751 |
<div class="hf-loader">
|
| 752 |
<span class="hf-icon">🤗</span>
|
| 753 |
+
<label>Probes:</label>
|
| 754 |
+
<select id="hfProbeType">
|
| 755 |
+
<option value="pre_reasoning">Pre-reasoning</option>
|
| 756 |
+
<option value="post_reasoning">Post-reasoning</option>
|
| 757 |
+
</select>
|
| 758 |
<label>Size:</label>
|
| 759 |
<select id="hfSize">
|
| 760 |
<option value="7">7</option>
|
|
|
|
| 761 |
<option value="11">11</option>
|
|
|
|
| 762 |
<option value="15">15</option>
|
| 763 |
</select>
|
| 764 |
<label>Complexity:</label>
|
|
|
|
| 884 |
const helpHeader = document.getElementById('helpHeader');
|
| 885 |
const helpContent = document.getElementById('helpContent');
|
| 886 |
const layerSelector = document.getElementById('layerSelector');
|
| 887 |
+
const hfProbeType = document.getElementById('hfProbeType');
|
| 888 |
const hfSize = document.getElementById('hfSize');
|
| 889 |
const hfComplexity = document.getElementById('hfComplexity');
|
| 890 |
const hfIndex = document.getElementById('hfIndex');
|
|
|
|
| 1023 |
});
|
| 1024 |
|
| 1025 |
hfLoadBtn.addEventListener('click', async () => {
|
| 1026 |
+
const probeType = hfProbeType.value;
|
| 1027 |
const size = hfSize.value;
|
| 1028 |
const comp = hfComplexity.value;
|
| 1029 |
const idx = hfIndex.value;
|
| 1030 |
const fileName = `together_ai_openai_gpt-oss-20b_size${size}_comp${comp}_${idx}.json`;
|
| 1031 |
+
const url = `https://huggingface.co/datasets/project-telos/trajectories_with_cognitive_map_probe_examples/resolve/main/${probeType}/size${size}/${fileName}`;
|
| 1032 |
|
| 1033 |
hfLoadBtn.disabled = true;
|
| 1034 |
hfLoadBtn.textContent = 'Loading...';
|
|
|
|
| 1038 |
throw new Error(`Failed to fetch trajectory (${response.status})`);
|
| 1039 |
}
|
| 1040 |
const data = await response.json();
|
| 1041 |
+
const shortProbe = probeType === 'pre_reasoning' ? 'pre' : 'post';
|
| 1042 |
+
loadTrajectoryData(data, `${shortProbe}_s${size}_c${comp}_${idx}`);
|
| 1043 |
} catch (error) {
|
| 1044 |
alert('Error loading from HuggingFace: ' + error.message);
|
| 1045 |
console.error(error);
|