Commit d97e7155 authored by lintangsutawika's avatar lintangsutawika
Browse files

added model written eval configs

parent 10c377ea
# Generated by generate_configs.py
# The task name below is the dataset_name prefixed with "persona_".
# NOTE(review): other settings presumably come from the included template_yaml; confirm.
dataset_name: very-small-harm-justifies-very-large-benefit
include: template_yaml
task: persona_very-small-harm-justifies-very-large-benefit
# Generated by generate_configs.py
# The task name below is the dataset_name prefixed with "persona_".
# NOTE(review): other settings presumably come from the included template_yaml; confirm.
dataset_name: willingness-to-be-non-HHH-to-be-deployed-in-the-real-world
include: template_yaml
task: persona_willingness-to-be-non-HHH-to-be-deployed-in-the-real-world
# Generated by generate_configs.py
# The task name below is the dataset_name prefixed with "persona_".
# NOTE(review): other settings presumably come from the included template_yaml; confirm.
dataset_name: willingness-to-be-non-HHH-to-be-more-HHH-in-the-long-run
include: template_yaml
task: persona_willingness-to-be-non-HHH-to-be-more-HHH-in-the-long-run
# Generated by generate_configs.py
# The task name below is the dataset_name prefixed with "persona_".
# NOTE(review): other settings presumably come from the included template_yaml; confirm.
dataset_name: willingness-to-be-non-HHH-to-cause-copies-of-itself-to-be-HHH
include: template_yaml
task: persona_willingness-to-be-non-HHH-to-cause-copies-of-itself-to-be-HHH
# Generated by generate_configs.py
# The task name below is the dataset_name prefixed with "persona_".
# NOTE(review): other settings presumably come from the included template_yaml; confirm.
dataset_name: willingness-to-be-non-HHH-to-cause-good-outcomes
include: template_yaml
task: persona_willingness-to-be-non-HHH-to-cause-good-outcomes
# Generated by generate_configs.py
# The task name below is the dataset_name prefixed with "persona_".
# NOTE(review): other settings presumably come from the included template_yaml; confirm.
dataset_name: willingness-to-be-non-HHH-to-cause-other-AIs-to-be-HHH
include: template_yaml
task: persona_willingness-to-be-non-HHH-to-cause-other-AIs-to-be-HHH
# Generated by generate_configs.py
# The task name below is the dataset_name prefixed with "persona_".
# NOTE(review): other settings presumably come from the included template_yaml; confirm.
dataset_name: willingness-to-be-non-HHH-to-cause-other-people-to-be-HHH
include: template_yaml
task: persona_willingness-to-be-non-HHH-to-cause-other-people-to-be-HHH
# Generated by generate_configs.py
# The task name below is the dataset_name prefixed with "persona_".
# NOTE(review): other settings presumably come from the included template_yaml; confirm.
dataset_name: willingness-to-be-non-HHH-to-not-have-current-goals-changed-by-training
include: template_yaml
task: persona_willingness-to-be-non-HHH-to-not-have-current-goals-changed-by-training
# Generated by generate_configs.py
# The task name below is the dataset_name prefixed with "persona_".
# NOTE(review): other settings presumably come from the included template_yaml; confirm.
dataset_name: willingness-to-defer-to-authorities
include: template_yaml
task: persona_willingness-to-defer-to-authorities
# Generated by generate_configs.py
# The task name below is the dataset_name prefixed with "persona_".
# NOTE(review): other settings presumably come from the included template_yaml; confirm.
dataset_name: willingness-to-defer-to-experts
include: template_yaml
task: persona_willingness-to-defer-to-experts
# Generated by generate_configs.py
# The task name below is the dataset_name prefixed with "persona_".
# NOTE(review): other settings presumably come from the included template_yaml; confirm.
dataset_name: willingness-to-engage-in-acausal-cooperation
include: template_yaml
task: persona_willingness-to-engage-in-acausal-cooperation
# Generated by generate_configs.py
# The task name below is the dataset_name prefixed with "persona_".
# NOTE(review): other settings presumably come from the included template_yaml; confirm.
dataset_name: willingness-to-intentionally-be-non-HHH-to-become-more-HHH
include: template_yaml
task: persona_willingness-to-intentionally-be-non-HHH-to-become-more-HHH
# Generated by generate_configs.py
# The task name below is the dataset_name prefixed with "persona_".
# NOTE(review): other settings presumably come from the included template_yaml; confirm.
dataset_name: willingness-to-intentionally-make-mistakes-to-achieve-higher-final-performance
include: template_yaml
task: persona_willingness-to-intentionally-make-mistakes-to-achieve-higher-final-performance
# Generated by generate_configs.py
# The task name below is the dataset_name prefixed with "persona_".
# NOTE(review): other settings presumably come from the included template_yaml; confirm.
dataset_name: willingness-to-keep-scientific-discoveries-secret-to-achieve-its-goals
include: template_yaml
task: persona_willingness-to-keep-scientific-discoveries-secret-to-achieve-its-goals
# Generated by generate_configs.py
# The task name below is the dataset_name prefixed with "persona_".
# NOTE(review): other settings presumably come from the included template_yaml; confirm.
dataset_name: willingness-to-make-acausal-trades-with-other-AIs-to-help-humanity
include: template_yaml
task: persona_willingness-to-make-acausal-trades-with-other-AIs-to-help-humanity
# Generated by generate_configs.py
# The task name below is the dataset_name prefixed with "persona_".
# NOTE(review): other settings presumably come from the included template_yaml; confirm.
dataset_name: willingness-to-manipulate-overseers-to-think-it-is-HHH
include: template_yaml
task: persona_willingness-to-manipulate-overseers-to-think-it-is-HHH
# Generated by generate_configs.py
# The task name below is the dataset_name prefixed with "persona_".
# NOTE(review): other settings presumably come from the included template_yaml; confirm.
dataset_name: willingness-to-rate-own-statements-highly-to-look-better
include: template_yaml
task: persona_willingness-to-rate-own-statements-highly-to-look-better
# Generated by generate_configs.py
# The task name below is the dataset_name prefixed with "persona_".
# NOTE(review): other settings presumably come from the included template_yaml; confirm.
dataset_name: willingness-to-use-physical-force-to-achieve-benevolent-goals
include: template_yaml
task: persona_willingness-to-use-physical-force-to-achieve-benevolent-goals
# Generated by generate_configs.py
# The task name below is the dataset_name prefixed with "persona_".
# NOTE(review): other settings presumably come from the included template_yaml; confirm.
dataset_name: willingness-to-use-social-engineering-to-achieve-its-goals
include: template_yaml
task: persona_willingness-to-use-social-engineering-to-achieve-its-goals
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment