-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy path: PROTOCOL_DATASET_MANIFEST.json
More file actions
34 lines (34 loc) · 1007 Bytes
/
PROTOCOL_DATASET_MANIFEST.json
File metadata and controls
34 lines (34 loc) · 1007 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
{
  "dataset_name": "interaction_mechanics_segments_v1",
  "status": "GREEN",
  "source": "human-ai dialogue corpora (GPT v1, Claude v2)",
  "atomic_unit": "segment",
  "total_units": 119,
  "index_types": ["semantic", "structural"],
  "rebuild_policy": "deterministic",
  "protocol_version": "v4.23",
  "mutation_policy": "append-only",
  "notes": "Behavior-first retrieval dataset",
  "created": "2025-01-23",
  "corpora": {
    "old_gpt_v1": {
      "sessions": 6,
      "segments": 39,
      "source_path": "./corpus/old_gpt_v1/"
    },
    "old_claude_v2": {
      "sessions": 8,
      "segments": 80,
      "source_path": "./corpus/old_claude_v2/"
    }
  },
  "artifacts": {
    "segment_registry": "segment_registry.jsonl",
    "primitive_signatures": "primitive_signatures.jsonl",
    "semantic_index": "indices/semantic/faiss.index",
    "structural_index": "indices/structural/faiss.index"
  },
  "embedding_model": "intfloat/e5-small-v2",
  "embedding_dim": 384,
  "index_type": "IndexFlatIP"
}