promptbench
latest
Get Started
promptbench Introduction
Installation
Examples
Basic Usage
Multi-Modal Models
DyVal Evaluation
Prompt Attack
Prompt Engineering
Adding new modules
Reference
dataload
dyval
metrics
models
utils
Leaderboards
Adversarial Prompt Leaderboard
Dynamic Evaluation Benchmark
Prompt Engineering Benchmark
promptbench
Index
Edit on GitHub
Index
A | B | C | D | E | G | I | L | M | N | O | P | Q | R | S | T | U | V | Y
A
abduct_node_value() (promptbench.dyval.DAG.logic_dag.AbductionDAG method)
AbductionDAG (class in promptbench.dyval.DAG.logic_dag)
AbductionDAGDescriber (class in promptbench.dyval.DAG.logic_dag)
add_rand_description() (promptbench.dyval.DAG.describer.BaseDAGDescriber method)
AI2D (class in promptbench.dataload.dataset)
ARC (class in promptbench.dataload.dataset)
ArithmeticDAG (class in promptbench.dyval.DAG.math_dag)
ArithmeticDAGDescriber (class in promptbench.dyval.DAG.math_dag)
B
BaichuanModel (class in promptbench.models.models)
BaseDAG (class in promptbench.dyval.DAG.dag)
BaseDAGDescriber (class in promptbench.dyval.DAG.describer)
basic_format() (promptbench.utils.dataprocess.InputProcess static method)
BBH (class in promptbench.dataload.dataset)
BigBench (class in promptbench.dataload.dataset)
BLIP2Model (class in promptbench.models.models)
BoolDAG (class in promptbench.dyval.DAG.logic_dag)
BoolDAGDescriber (class in promptbench.dyval.DAG.logic_dag)
BoolLogic (class in promptbench.dataload.dataset)
C
ChartQA (class in promptbench.dataload.dataset)
check_link_constraint() (promptbench.dyval.DAG.dag.BaseDAG method)
check_link_constraint() (promptbench.dyval.DAG.dag.TreeDAG method)
check_link_constraint() (promptbench.dyval.DAG.logic_dag.AbductionDAG method)
check_link_constraint() (promptbench.dyval.DAG.logic_dag.BoolDAG method)
check_link_constraint() (promptbench.dyval.DAG.logic_dag.DeductionDAG method)
check_link_constraint() (promptbench.dyval.DAG.math_dag.ArithmeticDAG method)
check_uni_ops() (promptbench.dyval.DAG.dag.TreeDAG method)
cls() (promptbench.utils.dataprocess.OutputProcess static method)
CodeDAG (class in promptbench.dyval.DAG.code_dag)
CodeDAGDescriber (class in promptbench.dyval.DAG.code_dag)
collect_nodes() (promptbench.dyval.DAG.dag.TreeDAG method)
compute_bleu() (promptbench.metrics.eval.Eval static method)
compute_cider() (promptbench.metrics.eval.Eval static method)
compute_cls_accuracy() (promptbench.metrics.eval.Eval static method)
compute_math_accuracy() (promptbench.metrics.eval.Eval static method)
compute_squad_v2_f1() (promptbench.metrics.eval.Eval static method)
compute_vqa_accuracy() (promptbench.metrics.eval.Eval static method)
create_dataset() (promptbench.dyval.dyval_dataset.DyValDataset method)
CSQA (class in promptbench.dataload.dataset)
D
Dataset (class in promptbench.dataload.dataset)
DatasetLoader (class in promptbench.dataload.dataload)
DeductionDAG (class in promptbench.dyval.DAG.logic_dag)
DeductionDAGDescriber (class in promptbench.dyval.DAG.logic_dag)
delete_description() (promptbench.dyval.DAG.describer.BaseDAGDescriber method)
describe_abduction() (promptbench.dyval.DAG.logic_dag.AbductionDAGDescriber method)
describe_answer() (promptbench.dyval.DAG.code_dag.CodeDAGDescriber method)
describe_answer() (promptbench.dyval.DAG.describer.GeneralDAGDescriber method)
describe_answer() (promptbench.dyval.DAG.describer.TreeDAGDescriber method)
describe_answer() (promptbench.dyval.DAG.logic_dag.AbductionDAGDescriber method)
describe_answer() (promptbench.dyval.DAG.math_dag.LinearEq method)
describe_inference_node() (promptbench.dyval.DAG.describer.TreeDAGDescriber method)
describe_inference_node() (promptbench.dyval.DAG.logic_dag.BoolDAGDescriber method)
describe_inference_node() (promptbench.dyval.DAG.logic_dag.DeductionDAGDescriber method)
describe_inference_node() (promptbench.dyval.DAG.math_dag.ArithmeticDAGDescriber method)
describe_inference_steps() (promptbench.dyval.DAG.code_dag.CodeDAGDescriber method)
describe_inference_steps() (promptbench.dyval.DAG.describer.TreeDAGDescriber method)
describe_inference_steps() (promptbench.dyval.DAG.logic_dag.AbductionDAGDescriber method)
describe_inference_steps() (promptbench.dyval.DAG.math_dag.LinearEq method)
describe_max_sum_path() (promptbench.dyval.DAG.code_dag.CodeDAGDescriber method)
describe_question() (promptbench.dyval.DAG.code_dag.CodeDAGDescriber method)
describe_question() (promptbench.dyval.DAG.describer.TreeDAGDescriber method)
describe_question() (promptbench.dyval.DAG.logic_dag.AbductionDAGDescriber method)
describe_question() (promptbench.dyval.DAG.math_dag.LinearEq method)
describe_question_node() (promptbench.dyval.DAG.describer.BaseDAGDescriber method)
describe_question_node() (promptbench.dyval.DAG.describer.GeneralDAGDescriber method)
describe_question_node() (promptbench.dyval.DAG.logic_dag.AbductionDAGDescriber method)
describe_question_node() (promptbench.dyval.DAG.logic_dag.BoolDAGDescriber method)
describe_question_node() (promptbench.dyval.DAG.logic_dag.DeductionDAGDescriber method)
describe_question_node() (promptbench.dyval.DAG.math_dag.ArithmeticDAGDescriber method)
describe_reachability() (promptbench.dyval.DAG.code_dag.CodeDAGDescriber method)
DROP (class in promptbench.dataload.dataset)
dyval_evaluate() (in module promptbench.dyval.dyval_utils)
DyValDataset (class in promptbench.dyval.dyval_dataset)
E
Eval (class in promptbench.metrics.eval)
extract_answer() (promptbench.dataload.dataset.BigBench method)
extract_answer() (promptbench.dataload.dataset.CSQA method)
extract_answer() (promptbench.dataload.dataset.Dataset method)
extract_answer() (promptbench.dataload.dataset.GSM8K method)
extract_answer() (promptbench.dataload.dataset.QASC method)
G
GeminiModel (class in promptbench.models.models)
GeminiVisionModel (class in promptbench.models.models)
general() (promptbench.utils.dataprocess.OutputProcess static method)
GeneralDAG (class in promptbench.dyval.DAG.dag)
GeneralDAGDescriber (class in promptbench.dyval.DAG.describer)
generate_cycles() (promptbench.dyval.DAG.dag.BaseDAG method)
generate_dag() (promptbench.dyval.DAG.dag.GeneralDAG method)
generate_dag() (promptbench.dyval.DAG.dag.TreeDAG method)
generate_rand_description() (promptbench.dyval.DAG.describer.BaseDAGDescriber method)
generate_rand_description() (promptbench.dyval.DAG.describer.GeneralDAGDescriber method)
generate_rand_description() (promptbench.dyval.DAG.describer.TreeDAGDescriber method)
generate_tree() (promptbench.dyval.DAG.dag.TreeDAG method)
generate_tree() (promptbench.dyval.DAG.logic_dag.AbductionDAG method)
generate_tree() (promptbench.dyval.DAG.logic_dag.BoolDAG method)
generate_tree() (promptbench.dyval.DAG.logic_dag.DeductionDAG method)
generate_tree() (promptbench.dyval.DAG.math_dag.ArithmeticDAG method)
get_fewshot_examples() (promptbench.dyval.dyval_dataset.DyValDataset method)
get_node_by_name() (promptbench.dyval.DAG.dag.BaseDAG method)
GLUE (class in promptbench.dataload.dataset)
GSM8K (class in promptbench.dataload.dataset)
I
InputProcess (class in promptbench.utils.dataprocess)
InternLMVisionModel (class in promptbench.models.models)
IWSLT (class in promptbench.dataload.dataset)
L
LastLetterConcat (class in promptbench.dataload.dataset)
LinearEq (class in promptbench.dyval.DAG.math_dag)
LlamaModel (class in promptbench.models.models)
LLaVAModel (class in promptbench.models.models)
LMMBaseModel (class in promptbench.models.models)
load_dataset() (promptbench.dataload.dataload.DatasetLoader static method)
M
Math (class in promptbench.dataload.dataset)
MathVista (class in promptbench.dataload.dataset)
max_sum_path() (promptbench.dyval.DAG.code_dag.CodeDAG method)
MistralModel (class in promptbench.models.models)
MixtralModel (class in promptbench.models.models)
MMLU (class in promptbench.dataload.dataset)
MMMU (class in promptbench.dataload.dataset)
module
promptbench.dataload.dataload
promptbench.dataload.dataset
promptbench.dyval.DAG.code_dag
promptbench.dyval.DAG.dag
promptbench.dyval.DAG.describer
promptbench.dyval.DAG.logic_dag
promptbench.dyval.DAG.math_dag
promptbench.dyval.dyval_dataset
promptbench.dyval.dyval_utils
promptbench.metrics.eval
promptbench.models.models
promptbench.utils.dataprocess
N
NoCaps (class in promptbench.dataload.dataset)
Node (class in promptbench.dyval.DAG.dag)
NumerSense (class in promptbench.dataload.dataset)
O
OpenAIModel (class in promptbench.models.models)
OpenAIVisionModel (class in promptbench.models.models)
OutputProcess (class in promptbench.utils.dataprocess)
P
PaLMModel (class in promptbench.models.models)
pattern_re() (promptbench.utils.dataprocess.OutputProcess static method)
pattern_split() (promptbench.utils.dataprocess.OutputProcess static method)
PhiModel (class in promptbench.models.models)
predict() (promptbench.models.models.GeminiModel method)
predict() (promptbench.models.models.GeminiVisionModel method)
predict() (promptbench.models.models.InternLMVisionModel method)
predict() (promptbench.models.models.LlamaModel method)
predict() (promptbench.models.models.LMMBaseModel method)
predict() (promptbench.models.models.OpenAIModel method)
predict() (promptbench.models.models.OpenAIVisionModel method)
predict() (promptbench.models.models.PaLMModel method)
predict() (promptbench.models.models.PhiModel method)
predict() (promptbench.models.models.QwenVLModel method)
predict() (promptbench.models.models.VicunaModel method)
predict() (promptbench.models.models.VLMBaseModel method)
process_dyval_inputs() (in module promptbench.dyval.dyval_utils)
process_dyval_preds() (in module promptbench.dyval.dyval_utils)
process_dyval_training_sample() (in module promptbench.dyval.dyval_utils)
promptbench.dataload.dataload (module)
promptbench.dataload.dataset (module)
promptbench.dyval.DAG.code_dag (module)
promptbench.dyval.DAG.dag (module)
promptbench.dyval.DAG.describer (module)
promptbench.dyval.DAG.logic_dag (module)
promptbench.dyval.DAG.math_dag (module)
promptbench.dyval.dyval_dataset (module)
promptbench.dyval.dyval_utils (module)
promptbench.metrics.eval (module)
promptbench.models.models (module)
promptbench.utils.dataprocess (module)
Q
QASC (class in promptbench.dataload.dataset)
QwenVLModel (class in promptbench.models.models)
R
random_traversal() (promptbench.dyval.DAG.describer.BaseDAGDescriber method)
reachability() (promptbench.dyval.DAG.code_dag.CodeDAG method)
reverse_topological_traversal() (promptbench.dyval.DAG.describer.BaseDAGDescriber method)
round_value() (in module promptbench.dyval.dyval_utils)
S
ScienceQA (class in promptbench.dataload.dataset)
shuffleDict() (in module promptbench.dataload.dataset)
SQUAD_V2 (class in promptbench.dataload.dataset)
T
T5Model (class in promptbench.models.models)
topological_sort() (promptbench.dyval.DAG.dag.BaseDAG method)
topological_traversal() (promptbench.dyval.DAG.describer.BaseDAGDescriber method)
TreeDAG (class in promptbench.dyval.DAG.dag)
TreeDAGDescriber (class in promptbench.dyval.DAG.describer)
U
UL2Model (class in promptbench.models.models)
UnMulti (class in promptbench.dataload.dataset)
update_values() (promptbench.dyval.DAG.dag.TreeDAG method)
update_values() (promptbench.dyval.DAG.logic_dag.AbductionDAG method)
update_values() (promptbench.dyval.DAG.logic_dag.BoolDAG method)
update_values() (promptbench.dyval.DAG.logic_dag.DeductionDAG method)
update_values() (promptbench.dyval.DAG.math_dag.ArithmeticDAG method)
V
ValidParentheses (class in promptbench.dataload.dataset)
VicunaModel (class in promptbench.models.models)
VLMBaseModel (class in promptbench.models.models)
VQAv2 (class in promptbench.dataload.dataset)
Y
YiModel (class in promptbench.models.models)
Read the Docs
v: latest
Versions
latest
Downloads
On Read the Docs
Project Home
Builds