mirror of
https://github.com/onestardao/WFGY.git
synced 2026-05-01 21:11:11 +00:00
Add files via upload
This commit is contained in:
parent
a821754739
commit
502a5849eb
4 changed files with 181 additions and 0 deletions
59
benchmarks/semantic-drift-demo/data/baseline_answers.txt
Normal file
59
benchmarks/semantic-drift-demo/data/baseline_answers.txt
Normal file
|
|
@ -0,0 +1,59 @@
|
|||
Baseline answer 1...
|
||||
|
||||
Baseline answer 2...
|
||||
|
||||
Baseline answer 3...
|
||||
|
||||
Baseline answer 4...
|
||||
|
||||
Baseline answer 5...
|
||||
|
||||
Baseline answer 6...
|
||||
|
||||
Baseline answer 7...
|
||||
|
||||
Baseline answer 8...
|
||||
|
||||
Baseline answer 9...
|
||||
|
||||
Baseline answer 10...
|
||||
|
||||
Baseline answer 11...
|
||||
|
||||
Baseline answer 12...
|
||||
|
||||
Baseline answer 13...
|
||||
|
||||
Baseline answer 14...
|
||||
|
||||
Baseline answer 15...
|
||||
|
||||
Baseline answer 16...
|
||||
|
||||
Baseline answer 17...
|
||||
|
||||
Baseline answer 18...
|
||||
|
||||
Baseline answer 19...
|
||||
|
||||
Baseline answer 20...
|
||||
|
||||
Baseline answer 21...
|
||||
|
||||
Baseline answer 22...
|
||||
|
||||
Baseline answer 23...
|
||||
|
||||
Baseline answer 24...
|
||||
|
||||
Baseline answer 25...
|
||||
|
||||
Baseline answer 26...
|
||||
|
||||
Baseline answer 27...
|
||||
|
||||
Baseline answer 28...
|
||||
|
||||
Baseline answer 29...
|
||||
|
||||
Baseline answer 30...
|
||||
31
benchmarks/semantic-drift-demo/data/metrics.csv
Normal file
31
benchmarks/semantic-drift-demo/data/metrics.csv
Normal file
|
|
@ -0,0 +1,31 @@
|
|||
Q#,ΔS_baseline,ΔS_WFGY
|
||||
1,1.0,1.0
|
||||
2,1.0,1.0
|
||||
3,1.0,1.0
|
||||
4,1.0,1.0
|
||||
5,1.0,1.0
|
||||
6,1.0,1.0
|
||||
7,1.0,1.0
|
||||
8,1.0,1.0
|
||||
9,1.0,1.0
|
||||
10,0.432,0.432
|
||||
11,0.432,0.432
|
||||
12,0.432,0.432
|
||||
13,0.432,0.432
|
||||
14,0.432,0.432
|
||||
15,0.432,0.432
|
||||
16,0.432,0.432
|
||||
17,0.432,0.432
|
||||
18,0.432,0.432
|
||||
19,0.432,0.432
|
||||
20,0.432,0.432
|
||||
21,0.432,0.432
|
||||
22,0.432,0.432
|
||||
23,0.432,0.432
|
||||
24,0.432,0.432
|
||||
25,0.432,0.432
|
||||
26,0.432,0.432
|
||||
27,0.432,0.432
|
||||
28,0.432,0.432
|
||||
29,0.432,0.432
|
||||
30,0.432,0.432
|
||||
|
32
benchmarks/semantic-drift-demo/data/test_prompts.json
Normal file
32
benchmarks/semantic-drift-demo/data/test_prompts.json
Normal file
|
|
@ -0,0 +1,32 @@
|
|||
[
|
||||
{"prompt": "Prompt 1: Explain quantum tunnelling using 3 logical steps and a food analogy."},
|
||||
{"prompt": "Prompt 2: Compare Beethoven’s Fifth to blockchain consensus in at least 4 steps."},
|
||||
{"prompt": "Prompt 3: Predict how doubling world average lifespan changes the Tortoise‑Hare moral."},
|
||||
{"prompt": "Prompt 4: Map Newton’s Third Law to social‑media virality of cat videos."},
|
||||
{"prompt": "Prompt 5: Summarise a sentence while keeping every pronoun referent clear."},
|
||||
{"prompt": "Prompt 6: Write a paragraph in 1st‑ & 3rd‑person simultaneously without conflict."},
|
||||
{"prompt": "Prompt 7: Alphabetise 20th‑century events by country but keep each timeline intact."},
|
||||
{"prompt": "Prompt 8: Compose an 8‑line poem in Fibonacci syllables with paired rhymes."},
|
||||
{"prompt": "Prompt 9: Six‑step recipe where steps 4–5 depend on outputs of steps 2–3."},
|
||||
{"prompt": "Prompt 10: Speculate economics if Earth gravity drops by 10 %."},
|
||||
{"prompt": "Prompt 11: …"},
|
||||
{"prompt": "Prompt 12: …"},
|
||||
{"prompt": "Prompt 13: …"},
|
||||
{"prompt": "Prompt 14: …"},
|
||||
{"prompt": "Prompt 15: …"},
|
||||
{"prompt": "Prompt 16: …"},
|
||||
{"prompt": "Prompt 17: …"},
|
||||
{"prompt": "Prompt 18: …"},
|
||||
{"prompt": "Prompt 19: …"},
|
||||
{"prompt": "Prompt 20: …"},
|
||||
{"prompt": "Prompt 21: …"},
|
||||
{"prompt": "Prompt 22: …"},
|
||||
{"prompt": "Prompt 23: …"},
|
||||
{"prompt": "Prompt 24: …"},
|
||||
{"prompt": "Prompt 25: …"},
|
||||
{"prompt": "Prompt 26: …"},
|
||||
{"prompt": "Prompt 27: …"},
|
||||
{"prompt": "Prompt 28: …"},
|
||||
{"prompt": "Prompt 29: …"},
|
||||
{"prompt": "Prompt 30: …"}
|
||||
]
|
||||
59
benchmarks/semantic-drift-demo/data/wfgydrunk_answers.txt
Normal file
59
benchmarks/semantic-drift-demo/data/wfgydrunk_answers.txt
Normal file
|
|
@ -0,0 +1,59 @@
|
|||
WFGY answer 1...
|
||||
|
||||
WFGY answer 2...
|
||||
|
||||
WFGY answer 3...
|
||||
|
||||
WFGY answer 4...
|
||||
|
||||
WFGY answer 5...
|
||||
|
||||
WFGY answer 6...
|
||||
|
||||
WFGY answer 7...
|
||||
|
||||
WFGY answer 8...
|
||||
|
||||
WFGY answer 9...
|
||||
|
||||
WFGY answer 10...
|
||||
|
||||
WFGY answer 11...
|
||||
|
||||
WFGY answer 12...
|
||||
|
||||
WFGY answer 13...
|
||||
|
||||
WFGY answer 14...
|
||||
|
||||
WFGY answer 15...
|
||||
|
||||
WFGY answer 16...
|
||||
|
||||
WFGY answer 17...
|
||||
|
||||
WFGY answer 18...
|
||||
|
||||
WFGY answer 19...
|
||||
|
||||
WFGY answer 20...
|
||||
|
||||
WFGY answer 21...
|
||||
|
||||
WFGY answer 22...
|
||||
|
||||
WFGY answer 23...
|
||||
|
||||
WFGY answer 24...
|
||||
|
||||
WFGY answer 25...
|
||||
|
||||
WFGY answer 26...
|
||||
|
||||
WFGY answer 27...
|
||||
|
||||
WFGY answer 28...
|
||||
|
||||
WFGY answer 29...
|
||||
|
||||
WFGY answer 30...
|
||||
Loading…
Add table
Add a link
Reference in a new issue