gsarti Claude Opus 4.6 committed on
Commit
d25b185
·
1 Parent(s): 1f2f100

Use trajectories_with_cognitive_map_probe_examples dataset

Browse files

Load trajectories with probe predictions from project-telos/trajectories_with_cognitive_map_probe_examples,
with pre/post-reasoning, size (7/11/15), complexity, and index selectors.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

Files changed (2) hide show
  1. README.md +1 -1
  2. index.html +10 -4
README.md CHANGED
@@ -10,7 +10,7 @@ license: apache-2.0
10
 
11
  Interactive trace viewer for visualizing language model agent trajectories in 2D grid environments, with probing results overlaid on tokens.
12
 
13
- Trajectories can be loaded directly from the [project-telos/trajectories_test_full](https://huggingface.co/datasets/project-telos/trajectories_test_full) dataset, or uploaded as JSON files (e.g. from [project-telos/trajectories_test_full_with_cognitive_map_probes](https://huggingface.co/datasets/project-telos/trajectories_test_full_with_cognitive_map_probes) for probe visualizations).
14
 
15
  Part of the paper: [A Behavioural and Representational Evaluation of Goal-Directedness in Language Model Agents](https://arxiv.org/abs/2602.08964).
16
 
 
10
 
11
  Interactive trace viewer for visualizing language model agent trajectories in 2D grid environments, with probing results overlaid on tokens.
12
 
13
+ Trajectories with probe predictions can be loaded directly from the [project-telos/trajectories_with_cognitive_map_probe_examples](https://huggingface.co/datasets/project-telos/trajectories_with_cognitive_map_probe_examples) dataset, or uploaded as JSON files.
14
 
15
  Part of the paper: [A Behavioural and Representational Evaluation of Goal-Directedness in Language Model Agents](https://arxiv.org/abs/2602.08964).
16
 
index.html CHANGED
@@ -750,12 +750,15 @@
750
  <div class="controls">
751
  <div class="hf-loader">
752
  <span class="hf-icon">🤗</span>
 
 
 
 
 
753
  <label>Size:</label>
754
  <select id="hfSize">
755
  <option value="7">7</option>
756
- <option value="9">9</option>
757
  <option value="11">11</option>
758
- <option value="13">13</option>
759
  <option value="15">15</option>
760
  </select>
761
  <label>Complexity:</label>
@@ -881,6 +884,7 @@
881
  const helpHeader = document.getElementById('helpHeader');
882
  const helpContent = document.getElementById('helpContent');
883
  const layerSelector = document.getElementById('layerSelector');
 
884
  const hfSize = document.getElementById('hfSize');
885
  const hfComplexity = document.getElementById('hfComplexity');
886
  const hfIndex = document.getElementById('hfIndex');
@@ -1019,11 +1023,12 @@
1019
  });
1020
 
1021
  hfLoadBtn.addEventListener('click', async () => {
 
1022
  const size = hfSize.value;
1023
  const comp = hfComplexity.value;
1024
  const idx = hfIndex.value;
1025
  const fileName = `together_ai_openai_gpt-oss-20b_size${size}_comp${comp}_${idx}.json`;
1026
- const url = `https://huggingface.co/datasets/project-telos/trajectories_test_full/resolve/main/size${size}/${fileName}`;
1027
 
1028
  hfLoadBtn.disabled = true;
1029
  hfLoadBtn.textContent = 'Loading...';
@@ -1033,7 +1038,8 @@
1033
  throw new Error(`Failed to fetch trajectory (${response.status})`);
1034
  }
1035
  const data = await response.json();
1036
- loadTrajectoryData(data, `s${size}_c${comp}_${idx}`);
 
1037
  } catch (error) {
1038
  alert('Error loading from HuggingFace: ' + error.message);
1039
  console.error(error);
 
750
  <div class="controls">
751
  <div class="hf-loader">
752
  <span class="hf-icon">🤗</span>
753
+ <label>Probes:</label>
754
+ <select id="hfProbeType">
755
+ <option value="pre_reasoning">Pre-reasoning</option>
756
+ <option value="post_reasoning">Post-reasoning</option>
757
+ </select>
758
  <label>Size:</label>
759
  <select id="hfSize">
760
  <option value="7">7</option>
 
761
  <option value="11">11</option>
 
762
  <option value="15">15</option>
763
  </select>
764
  <label>Complexity:</label>
 
884
  const helpHeader = document.getElementById('helpHeader');
885
  const helpContent = document.getElementById('helpContent');
886
  const layerSelector = document.getElementById('layerSelector');
887
+ const hfProbeType = document.getElementById('hfProbeType');
888
  const hfSize = document.getElementById('hfSize');
889
  const hfComplexity = document.getElementById('hfComplexity');
890
  const hfIndex = document.getElementById('hfIndex');
 
1023
  });
1024
 
1025
  hfLoadBtn.addEventListener('click', async () => {
1026
+ const probeType = hfProbeType.value;
1027
  const size = hfSize.value;
1028
  const comp = hfComplexity.value;
1029
  const idx = hfIndex.value;
1030
  const fileName = `together_ai_openai_gpt-oss-20b_size${size}_comp${comp}_${idx}.json`;
1031
+ const url = `https://huggingface.co/datasets/project-telos/trajectories_with_cognitive_map_probe_examples/resolve/main/${probeType}/size${size}/${fileName}`;
1032
 
1033
  hfLoadBtn.disabled = true;
1034
  hfLoadBtn.textContent = 'Loading...';
 
1038
  throw new Error(`Failed to fetch trajectory (${response.status})`);
1039
  }
1040
  const data = await response.json();
1041
+ const shortProbe = probeType === 'pre_reasoning' ? 'pre' : 'post';
1042
+ loadTrajectoryData(data, `${shortProbe}_s${size}_c${comp}_${idx}`);
1043
  } catch (error) {
1044
  alert('Error loading from HuggingFace: ' + error.message);
1045
  console.error(error);