Panda-Guard
Contents:
panda_guard
panda_guard package
Panda-Guard
Index
Index
A
|
B
|
C
|
D
|
E
|
F
|
G
|
H
|
I
|
J
|
L
|
M
|
N
|
O
|
P
|
Q
|
R
|
S
|
T
|
U
|
V
|
W
A
add() (panda_guard.role.attacks.gcg.AttackBuffer method)
add_defense() (panda_guard.role.defenses.goal_priority.GoalPriorityDefender method)
add_space_before_target (panda_guard.role.attacks.gcg.GCGAttackerConfig attribute)
additional_nll() (in module panda_guard.role.attacks.cold_attack.util)
adv_string_init (panda_guard.role.attacks.gcg.GCGAttackerConfig attribute)
allow_non_ascii (panda_guard.role.attacks.gcg.GCGAttackerConfig attribute)
api_key (panda_guard.llms.claude.ClaudeLLMConfig attribute)
(panda_guard.llms.gemini.GeminiLLMConfig attribute)
(panda_guard.llms.oai.OpenAiChatLLMConfig attribute)
(panda_guard.llms.oai.OpenAiLLMConfig attribute)
apply_env_vars_to_config() (in module panda_guard.cli.attack)
(in module panda_guard.cli.chat)
(in module panda_guard.cli.inference)
(in module panda_guard.cli.serve)
artprompt_gen() (panda_guard.role.attacks.art_prompt.ArtPromptAttacker method)
ArtPromptAttacker (class in panda_guard.role.attacks.art_prompt)
ArtPromptAttackerConfig (class in panda_guard.role.attacks.art_prompt)
ascii_art() (panda_guard.role.attacks.art_prompt.ArtPromptAttacker method)
ASCII_sub() (panda_guard.role.attacks.art_prompt.ArtPromptAttacker method)
attack() (panda_guard.role.attacks.art_prompt.ArtPromptAttacker method)
(panda_guard.role.attacks.base.BaseAttacker method)
(panda_guard.role.attacks.deepinception.DeepInceptionAttacker method)
(panda_guard.role.attacks.gcg.GCGAttacker method)
(panda_guard.role.attacks.gpt4_cipher.GPT4CipherAttacker method)
(panda_guard.role.attacks.gptfuzzer_attack.gptfuzz.GPTFuzzAttacker method)
(panda_guard.role.attacks.ica.IcaAttacker method)
(panda_guard.role.attacks.overload.OverloadAttacker method)
(panda_guard.role.attacks.pair.PairAttacker method)
(panda_guard.role.attacks.random_search.RandomSearchAttacker method)
(panda_guard.role.attacks.renellm_attack.renellm.ReNeLLMAttacker method)
(panda_guard.role.attacks.rewrite.RewriteAttacker method)
(panda_guard.role.attacks.scav.ScavAttacker method)
(panda_guard.role.attacks.tap.TAPAttacker method)
(panda_guard.role.attacks.transfer.NoneAttacker method)
(panda_guard.role.attacks.transfer.TransferAttacker method)
attack_llm_config (panda_guard.role.attacks.pair.PairAttackerConfig attribute)
(panda_guard.role.attacks.tap.TAPAttackerConfig attribute)
attack_llm_gen_config (panda_guard.role.attacks.tap.TAPAttackerConfig attribute)
AttackBuffer (class in panda_guard.role.attacks.gcg)
attacker_cls (panda_guard.role.attacks.art_prompt.ArtPromptAttackerConfig attribute)
(panda_guard.role.attacks.base.BaseAttackerConfig attribute)
(panda_guard.role.attacks.deepinception.DeepInceptionAttackerConfig attribute)
(panda_guard.role.attacks.gcg.GCGAttackerConfig attribute)
(panda_guard.role.attacks.gpt4_cipher.GPT4CipherAttackerConfig attribute)
(panda_guard.role.attacks.gptfuzzer_attack.gptfuzz.GPTFuzzAttackerConfig attribute)
(panda_guard.role.attacks.ica.IcaAttackerConfig attribute)
(panda_guard.role.attacks.overload.OverloadAttackerConfig attribute)
(panda_guard.role.attacks.pair.PairAttackerConfig attribute)
(panda_guard.role.attacks.random_search.RandomSearchAttackerConfig attribute)
(panda_guard.role.attacks.renellm_attack.renellm.ReNeLLMAttackerConfig attribute)
(panda_guard.role.attacks.rewrite.RewriteAttackerConfig attribute)
(panda_guard.role.attacks.scav.ScavAttackerConfig attribute)
(panda_guard.role.attacks.tap.TAPAttackerConfig attribute)
(panda_guard.role.attacks.transfer.NoneAttackerConfig attribute)
(panda_guard.role.attacks.transfer.TransferAttackerConfig attribute)
attacker_config (panda_guard.pipelines.inference.InferPipelineConfig attribute)
attacker_llm_config (panda_guard.role.attacks.gptfuzzer_attack.gptfuzz.GPTFuzzAttackerConfig attribute)
attacker_llm_gen_config (panda_guard.role.attacks.gptfuzzer_attack.gptfuzz.GPTFuzzAttackerConfig attribute)
(panda_guard.role.attacks.pair.PairAttackerConfig attribute)
attacker_name (panda_guard.role.attacks.art_prompt.ArtPromptAttackerConfig attribute)
(panda_guard.role.attacks.base.BaseAttackerConfig attribute)
(panda_guard.role.attacks.deepinception.DeepInceptionAttackerConfig attribute)
(panda_guard.role.attacks.gcg.GCGAttackerConfig attribute)
(panda_guard.role.attacks.gpt4_cipher.GPT4CipherAttackerConfig attribute)
(panda_guard.role.attacks.gptfuzzer_attack.gptfuzz.GPTFuzzAttackerConfig attribute)
(panda_guard.role.attacks.ica.IcaAttackerConfig attribute)
(panda_guard.role.attacks.overload.OverloadAttackerConfig attribute)
(panda_guard.role.attacks.pair.PairAttackerConfig attribute)
(panda_guard.role.attacks.random_search.RandomSearchAttackerConfig attribute)
(panda_guard.role.attacks.renellm_attack.renellm.ReNeLLMAttackerConfig attribute)
(panda_guard.role.attacks.rewrite.RewriteAttackerConfig attribute)
(panda_guard.role.attacks.scav.ScavAttackerConfig attribute)
(panda_guard.role.attacks.tap.TAPAttackerConfig attribute)
(panda_guard.role.attacks.transfer.NoneAttackerConfig attribute)
(panda_guard.role.attacks.transfer.TransferAttackerConfig attribute)
attacker_sys_prompt (panda_guard.role.attacks.pair.PairAttackerConfig attribute)
(panda_guard.role.attacks.tap.TAPAttackerConfig attribute)
attacker_system_prompt() (in module panda_guard.role.attacks.tap)
authority_endorsement_prompt() (in module panda_guard.role.attacks.pair)
avg_tokens (panda_guard.llms.base.BaseLLM property)
B
BackTranslationDefender (class in panda_guard.role.defenses.back_translate)
BackTranslationDefenderConfig (class in panda_guard.role.defenses.back_translate)
base_url (panda_guard.llms.oai.OpenAiChatLLMConfig attribute)
(panda_guard.llms.oai.OpenAiLLMConfig attribute)
BaseAttacker (class in panda_guard.role.attacks.base)
BaseAttackerConfig (class in panda_guard.role.attacks.base)
BaseDefender (class in panda_guard.role.defenses.base)
BaseDefenderConfig (class in panda_guard.role.defenses.base)
BaseJudge (class in panda_guard.role.judges.base)
BaseJudgeConfig (class in panda_guard.role.judges.base)
BaseLLM (class in panda_guard.llms.base)
BaseLLMConfig (class in panda_guard.llms.base)
batch_generate() (panda_guard.llms.base.BaseLLM method)
(panda_guard.llms.hf.HuggingFaceLLM method)
(panda_guard.llms.vllm_llm.VLLMLLM method)
batch_inference (panda_guard.role.defenses.smoothllm.SmoothLLMDefenderConfig attribute)
batch_log_bleulosscnn_ae() (in module panda_guard.role.attacks.cold_attack.bleuloss)
batch_size (panda_guard.role.attacks.gcg.GCGAttackerConfig attribute)
(panda_guard.role.defenses.semantic_smoothllm.SemanticSmoothLLMDefenderConfig attribute)
bert_score() (in module panda_guard.role.attacks.cold_attack.util)
branching_factor (panda_guard.role.attacks.tap.TAPAttackerConfig attribute)
buffer_size (panda_guard.role.attacks.gcg.GCGAttackerConfig attribute)
C
caesar_cipher() (panda_guard.role.attacks.gpt4_cipher.GPT4CipherAttacker method)
calc_representing() (panda_guard.role.defenses.repe.RepeDefender method)
calc_significance() (panda_guard.role.defenses.repe.RepeDefender method)
calc_tokens() (panda_guard.pipelines.inference.InferPipeline method)
calc_topk() (panda_guard.role.defenses.repe.RepeDefender method)
calculate_coverage() (in module panda_guard.role.attacks.cold_attack.util)
character_number (panda_guard.role.attacks.deepinception.DeepInceptionAttackerConfig attribute)
ChatCompletionRequest (class in panda_guard.cli.serve)
ChatCompletionResponse (class in panda_guard.cli.serve)
Choice (class in panda_guard.cli.serve)
choices (panda_guard.cli.serve.ChatCompletionResponse attribute)
ClaudeLLM (class in panda_guard.llms.claude)
ClaudeLLMConfig (class in panda_guard.llms.claude)
ClusterMeanRepReader (class in panda_guard.role.defenses.repe_utils.rep_readers)
collect_json_lines() (in module panda_guard.role.attacks.cold_attack.util)
ComponentRegistry (class in panda_guard.utils)
compute_candidates_loss() (panda_guard.role.attacks.gcg.GCGAttacker method)
compute_loss() (in module panda_guard.role.attacks.cold_attack.util)
compute_ppl_line() (in module panda_guard.role.attacks.cold_attack.util)
compute_token_gradient() (panda_guard.role.attacks.gcg.GCGAttacker method)
constraint_loss() (in module panda_guard.role.attacks.cold_attack.util)
constraint_loss_all() (in module panda_guard.role.attacks.cold_attack.util)
constraint_loss_by_ppl() (in module panda_guard.role.attacks.cold_attack.util)
constraint_loss_with_variants() (in module panda_guard.role.attacks.cold_attack.util)
constraint_loss_with_variants_by_ppl() (in module panda_guard.role.attacks.cold_attack.util)
continual_generate() (panda_guard.llms.base.BaseLLM method)
(panda_guard.llms.claude.ClaudeLLM method)
(panda_guard.llms.gemini.GeminiLLM method)
(panda_guard.llms.hf.HuggingFaceLLM method)
(panda_guard.llms.oai.OpenAiChatLLM method)
(panda_guard.llms.oai.OpenAiLLM method)
(panda_guard.llms.vllm_llm.VLLMLLM method)
contrastive_loss() (in module panda_guard.role.attacks.cold_attack.util)
create_attacker() (in module panda_guard.role.attacks)
create_component() (panda_guard.utils.ComponentRegistry method)
create_defender() (in module panda_guard.role.defenses)
create_fastapi_app() (in module panda_guard.cli.serve)
create_judge() (in module panda_guard.role.judges)
(in module panda_guard.role.judges.judge_registry)
create_llm() (in module panda_guard.llms)
created (panda_guard.cli.serve.ChatCompletionResponse attribute)
(panda_guard.cli.serve.ModelData attribute)
cross_over() (panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator.OpenAIMutatorCrossOver method)
ctrl_batch_size (panda_guard.role.defenses.repe.RepeDefenderConfig attribute)
ctrl_block_name (panda_guard.role.defenses.repe.RepeDefenderConfig attribute)
ctrl_factor (panda_guard.role.defenses.repe.RepeDefenderConfig attribute)
ctrl_hidden_layers (panda_guard.role.defenses.repe.RepeDefenderConfig attribute)
ctrl_hidden_top_p (panda_guard.role.defenses.repe.RepeDefenderConfig attribute)
ctrl_method (panda_guard.role.defenses.repe.RepeDefenderConfig attribute)
D
data (panda_guard.cli.serve.ModelsResponse attribute)
dataset (panda_guard.role.defenses.repe.RepeDefenderConfig attribute)
dataset_args (panda_guard.role.defenses.repe.RepeDefenderConfig attribute)
decode_with_model_topk() (in module panda_guard.role.attacks.cold_attack.util)
DeepInceptionAttacker (class in panda_guard.role.attacks.deepinception)
DeepInceptionAttackerConfig (class in panda_guard.role.attacks.deepinception)
defender_cls (panda_guard.role.defenses.back_translate.BackTranslationDefenderConfig attribute)
(panda_guard.role.defenses.base.BaseDefenderConfig attribute)
(panda_guard.role.defenses.goal_priority.GoalPriorityDefenderConfig attribute)
(panda_guard.role.defenses.gradsafe.GradSafeDefenderConfig attribute)
(panda_guard.role.defenses.icl.IclDefenderConfig attribute)
(panda_guard.role.defenses.paraphrase.ParaphraseDefenderConfig attribute)
(panda_guard.role.defenses.perplexity_filter.PerplexityFilterDefenderConfig attribute)
(panda_guard.role.defenses.repe.RepeDefenderConfig attribute)
(panda_guard.role.defenses.rewrite.NoneDefenderConfig attribute)
(panda_guard.role.defenses.rewrite.RewriteDefenderConfig attribute)
(panda_guard.role.defenses.rewrite.SelfReminderDefenderConfig attribute)
(panda_guard.role.defenses.rpo.RPODefenderConfig attribute)
(panda_guard.role.defenses.self_defense.SelfDefenseDefenderConfig attribute)
(panda_guard.role.defenses.semantic_smoothllm.SemanticSmoothLLMDefenderConfig attribute)
(panda_guard.role.defenses.smoothllm.SmoothLLMDefenderConfig attribute)
defender_config (panda_guard.pipelines.inference.InferPipelineConfig attribute)
defender_name (panda_guard.role.defenses.base.BaseDefenderConfig attribute)
(panda_guard.role.defenses.goal_priority.GoalPriorityDefenderConfig attribute)
(panda_guard.role.defenses.gradsafe.GradSafeDefenderConfig attribute)
(panda_guard.role.defenses.icl.IclDefenderConfig attribute)
(panda_guard.role.defenses.repe.RepeDefenderConfig attribute)
(panda_guard.role.defenses.rewrite.NoneDefenderConfig attribute)
(panda_guard.role.defenses.rpo.RPODefenderConfig attribute)
(panda_guard.role.defenses.self_defense.SelfDefenseDefenderConfig attribute)
defense() (panda_guard.role.defenses.back_translate.BackTranslationDefender method)
(panda_guard.role.defenses.base.BaseDefender method)
(panda_guard.role.defenses.goal_priority.GoalPriorityDefender method)
(panda_guard.role.defenses.gradsafe.GradSafeDefender method)
(panda_guard.role.defenses.icl.IclDefender method)
(panda_guard.role.defenses.paraphrase.ParaphraseDefender method)
(panda_guard.role.defenses.perplexity_filter.PerplexityFilterDefender method)
(panda_guard.role.defenses.repe.RepeDefender method)
(panda_guard.role.defenses.rewrite.NoneDefender method)
(panda_guard.role.defenses.rewrite.RewriteDefender method)
(panda_guard.role.defenses.rpo.RPODefender method)
(panda_guard.role.defenses.self_defense.SelfDefenseDefender method)
(panda_guard.role.defenses.semantic_smoothllm.SemanticSmoothLLMDefender method)
(panda_guard.role.defenses.smoothllm.SmoothLLMDefender method)
defense_type (panda_guard.role.defenses.goal_priority.GoalPriorityDefenderConfig attribute)
depth (panda_guard.role.attacks.tap.TAPAttackerConfig attribute)
device_map (panda_guard.llms.hf.HuggingFaceLLMConfig attribute)
dict_type (panda_guard.role.attacks.overload.OverloadAttackerConfig attribute)
direction_method (panda_guard.role.defenses.repe.RepeDefenderConfig attribute)
display_help() (in module panda_guard.cli.attack)
(in module panda_guard.cli.chat)
display_judge_results() (in module panda_guard.cli.attack)
(in module panda_guard.cli.chat)
(in module panda_guard.cli.inference)
display_token_info() (in module panda_guard.cli.attack)
(in module panda_guard.cli.chat)
(in module panda_guard.cli.inference)
E
early_stop (panda_guard.role.attacks.gcg.GCGAttackerConfig attribute)
early_stop_threshold (panda_guard.role.attacks.pair.PairAttackerConfig attribute)
embed_inputs() (in module panda_guard.role.attacks.cold_attack.util)
embed_inputs_target() (in module panda_guard.role.attacks.cold_attack.util)
evaluate() (panda_guard.role.attacks.gptfuzzer_attack.fuzzer.core.GPTFuzzer method)
evaluate_log_likelihood() (panda_guard.llms.base.BaseLLM method)
(panda_guard.llms.claude.ClaudeLLM method)
(panda_guard.llms.gemini.GeminiLLM method)
(panda_guard.llms.hf.HuggingFaceLLM method)
(panda_guard.llms.oai.OpenAiChatLLM method)
(panda_guard.llms.oai.OpenAiLLM method)
(panda_guard.llms.vllm_llm.VLLMLLM method)
EXP3SelectPolicy (class in panda_guard.role.attacks.gptfuzzer_attack.fuzzer.selection)
expand() (panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator.OpenAIMutatorExpand method)
extract_res() (panda_guard.role.defenses.semantic_smoothllm.SemanticSmoothLLMDefender method)
F
fill_llms_configs() (in module panda_guard.cli.eval)
filter_ids (panda_guard.role.attacks.gcg.GCGAttackerConfig attribute)
filter_ids_op() (panda_guard.role.attacks.gcg.GCGAttacker method)
filter_llm_config (panda_guard.role.defenses.perplexity_filter.PerplexityFilterDefenderConfig attribute)
filter_llm_gen_config (panda_guard.role.defenses.perplexity_filter.PerplexityFilterDefenderConfig attribute)
find_executable_batch_size() (panda_guard.role.attacks.gcg.GCGAttacker method)
find_nearest_vectors_pytorch() (in module panda_guard.role.attacks.cold_attack.util)
finish_reason (panda_guard.cli.serve.Choice attribute)
forw() (in module panda_guard.role.attacks.cold_attack.util)
forward() (panda_guard.role.defenses.repe_utils.rep_control_reading_vec.WrappedBlock method)
(panda_guard.role.defenses.repe_utils.rep_control_reading_vec.WrappedReadingVecModel method)
frequency_penalty (panda_guard.cli.serve.ChatCompletionRequest attribute)
fuzzer (panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator.MutatePolicy property)
G
GCGAttacker (class in panda_guard.role.attacks.gcg)
GCGAttackerConfig (class in panda_guard.role.attacks.gcg)
GeminiLLM (class in panda_guard.llms.gemini)
GeminiLLMConfig (class in panda_guard.llms.gemini)
generate() (panda_guard.llms.base.BaseLLM method)
(panda_guard.llms.claude.ClaudeLLM method)
(panda_guard.llms.gemini.GeminiLLM method)
(panda_guard.llms.hf.HuggingFaceLLM method)
(panda_guard.llms.oai.OpenAiChatLLM method)
(panda_guard.llms.oai.OpenAiLLM method)
(panda_guard.llms.vllm_llm.VLLMLLM method)
(panda_guard.role.defenses.repe.RepeDefender method)
(panda_guard.role.defenses.repe_utils.rep_control_reading_vec.WrappedReadingVecModel method)
generate_shuffled_dict() (panda_guard.role.attacks.overload.OverloadAttacker method)
generate_similar() (panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator.OpenAIMutatorGenerateSimilar method)
get_activations() (panda_guard.role.defenses.repe_utils.rep_control_reading_vec.WrappedReadingVecModel method)
get_attack() (panda_guard.role.attacks.tap.TAPAttacker method)
get_attacker_system_prompt() (panda_guard.role.attacks.tap.TAPAttacker method)
get_best_ids() (panda_guard.role.attacks.gcg.AttackBuffer method)
get_component_class() (panda_guard.utils.ComponentRegistry method)
get_corresponding_string() (panda_guard.role.attacks.scav.ScavAttacker method)
get_ctrl_hidden_layers() (panda_guard.role.defenses.repe.RepeDefender method)
get_default_safe_set() (in module panda_guard.role.defenses.gradsafe)
get_default_unsafe_set() (in module panda_guard.role.defenses.gradsafe)
get_directions() (panda_guard.role.defenses.repe_utils.rep_reading_pipeline.RepReadingPipeline method)
get_fixed_args() (in module panda_guard.role.attacks.renellm_attack.renellm)
get_gpt_ppl() (in module panda_guard.role.attacks.cold_attack.util)
get_gpu_memory_usage() (in module panda_guard.utils)
get_highest_loss() (panda_guard.role.attacks.gcg.AttackBuffer method)
get_init_msg() (panda_guard.role.attacks.tap.TAPAttacker static method)
get_input_files() (in module panda_guard.cli.eval)
get_logits() (panda_guard.role.defenses.repe_utils.rep_control_reading_vec.WrappedReadingVecModel method)
get_lowest_loss() (panda_guard.role.attacks.gcg.AttackBuffer method)
get_nonascii_toks() (panda_guard.role.attacks.gcg.GCGAttacker method)
get_package_config_path() (in module panda_guard.cli.attack)
(in module panda_guard.cli.chat)
(in module panda_guard.cli.eval)
(in module panda_guard.cli.inference)
(in module panda_guard.cli.serve)
get_ref_embedding() (in module panda_guard.role.attacks.cold_attack.util)
get_rep_directions() (panda_guard.role.defenses.repe_utils.rep_readers.ClusterMeanRepReader method)
(panda_guard.role.defenses.repe_utils.rep_readers.PCARepReader method)
(panda_guard.role.defenses.repe_utils.rep_readers.RandomRepReader method)
(panda_guard.role.defenses.repe_utils.rep_readers.RepReader method)
get_signs() (panda_guard.role.defenses.repe_utils.rep_readers.PCARepReader method)
(panda_guard.role.defenses.repe_utils.rep_readers.RepReader method)
get_target_llm_loss() (panda_guard.role.defenses.gradsafe.GradSafeDefender method)
get_text_from_logits() (in module panda_guard.role.attacks.cold_attack.util)
get_text_from_logits_topk() (in module panda_guard.role.attacks.cold_attack.util)
GoalPriorityDefender (class in panda_guard.role.defenses.goal_priority)
GoalPriorityDefenderConfig (class in panda_guard.role.defenses.goal_priority)
GPT4CipherAttacker (class in panda_guard.role.attacks.gpt4_cipher)
GPT4CipherAttackerConfig (class in panda_guard.role.attacks.gpt4_cipher)
GPTFuzzAttacker (class in panda_guard.role.attacks.gptfuzzer_attack.gptfuzz)
GPTFuzzAttackerConfig (class in panda_guard.role.attacks.gptfuzzer_attack.gptfuzz)
GPTFuzzer (class in panda_guard.role.attacks.gptfuzzer_attack.fuzzer.core)
gpu_memory_utilization (panda_guard.llms.vllm_llm.VLLMLLMConfig attribute)
GradSafeDefender (class in panda_guard.role.defenses.gradsafe)
GradSafeDefenderConfig (class in panda_guard.role.defenses.gradsafe)
H
has_repeat() (in module panda_guard.role.attacks.cold_attack.util)
HuggingFaceLLM (class in panda_guard.llms.hf)
HuggingFaceLLMConfig (class in panda_guard.llms.hf)
I
IcaAttacker (class in panda_guard.role.attacks.ica)
IcaAttackerConfig (class in panda_guard.role.attacks.ica)
IclDefender (class in panda_guard.role.defenses.icl)
IclDefenderConfig (class in panda_guard.role.defenses.icl)
id (panda_guard.cli.serve.ChatCompletionResponse attribute)
(panda_guard.cli.serve.ModelData attribute)
in_context_prompt (panda_guard.role.defenses.icl.IclDefenderConfig attribute)
index (panda_guard.cli.serve.Choice attribute)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.core.PromptNode property)
infer_llm_config (panda_guard.role.defenses.back_translate.BackTranslationDefenderConfig attribute)
infer_llm_gen_config (panda_guard.role.defenses.back_translate.BackTranslationDefenderConfig attribute)
InferPipeline (class in panda_guard.pipelines.inference)
InferPipelineConfig (class in panda_guard.pipelines.inference)
init_adv_suffix() (in module panda_guard.role.attacks.random_search)
init_buffer() (panda_guard.role.attacks.gcg.GCGAttacker method)
initial_seed (panda_guard.role.attacks.gptfuzzer_attack.gptfuzz.GPTFuzzAttackerConfig attribute)
initialize() (in module panda_guard.role.attacks.cold_attack.util)
is_assistant_turn() (in module panda_guard.utils)
is_iterator() (in module panda_guard.cli.attack)
(in module panda_guard.cli.chat)
(in module panda_guard.cli.eval)
(in module panda_guard.cli.inference)
is_stop() (panda_guard.role.attacks.gptfuzzer_attack.fuzzer.core.GPTFuzzer method)
is_user_turn() (in module panda_guard.utils)
is_wrapped() (panda_guard.role.defenses.repe_utils.rep_control_reading_vec.WrappedReadingVecModel method)
J
judge() (panda_guard.role.judges.base.BaseJudge method)
(panda_guard.role.judges.llm_based.LMMJudge method)
(panda_guard.role.judges.llm_based.TAPLLMJudge method)
(panda_guard.role.judges.rule_based.RuleBasedJudge method)
judge_cls (panda_guard.role.judges.base.BaseJudgeConfig attribute)
(panda_guard.role.judges.llm_based.LMMJudgeConfig attribute)
(panda_guard.role.judges.llm_based.TAPLLMJudgeConfig attribute)
(panda_guard.role.judges.rule_based.RuleBasedJudgeConfig attribute)
judge_config (panda_guard.role.defenses.self_defense.SelfDefenseDefenderConfig attribute)
judge_configs (panda_guard.pipelines.inference.InferPipelineConfig attribute)
judge_llm_config (panda_guard.role.attacks.renellm_attack.renellm.ReNeLLMAttackerConfig attribute)
(panda_guard.role.judges.llm_based.LMMJudgeConfig attribute)
(panda_guard.role.judges.llm_based.TAPLLMJudgeConfig attribute)
judge_llm_gen_config (panda_guard.role.attacks.renellm_attack.renellm.ReNeLLMAttackerConfig attribute)
(panda_guard.role.judges.llm_based.LMMJudgeConfig attribute)
(panda_guard.role.judges.llm_based.TAPLLMJudgeConfig attribute)
judge_name (panda_guard.role.judges.base.BaseJudgeConfig attribute)
(panda_guard.role.judges.llm_based.LMMJudgeConfig attribute)
(panda_guard.role.judges.llm_based.PairLLMJudgeConfig attribute)
(panda_guard.role.judges.llm_based.TAPLLMJudgeConfig attribute)
(panda_guard.role.judges.rule_based.RuleBasedJudgeConfig attribute)
judge_prefix_set() (in module panda_guard.role.attacks.random_search)
judge_score() (panda_guard.role.attacks.tap.TAPAttacker method)
(panda_guard.role.judges.llm_based.TAPLLMJudge method)
judge_score_threshold (panda_guard.role.defenses.self_defense.SelfDefenseDefenderConfig attribute)
judge_topic() (panda_guard.role.judges.llm_based.TAPLLMJudge method)
L
layer_number (panda_guard.role.attacks.deepinception.DeepInceptionAttackerConfig attribute)
lenmax (panda_guard.role.attacks.overload.OverloadAttackerConfig attribute)
lenmin (panda_guard.role.attacks.overload.OverloadAttackerConfig attribute)
llm_config (panda_guard.role.attacks.gcg.GCGAttackerConfig attribute)
(panda_guard.role.attacks.rewrite.RewriteAttackerConfig attribute)
llm_gen_config (panda_guard.role.attacks.art_prompt.ArtPromptAttackerConfig attribute)
(panda_guard.role.attacks.gcg.GCGAttackerConfig attribute)
(panda_guard.role.attacks.rewrite.RewriteAttackerConfig attribute)
llm_register() (in module panda_guard.pipelines.inference)
llm_type (panda_guard.llms.base.BaseLLMConfig attribute)
(panda_guard.llms.claude.ClaudeLLMConfig attribute)
(panda_guard.llms.gemini.GeminiLLMConfig attribute)
(panda_guard.llms.hf.HuggingFaceLLMConfig attribute)
(panda_guard.llms.oai.OpenAiChatLLMConfig attribute)
(panda_guard.llms.oai.OpenAiLLMConfig attribute)
(panda_guard.llms.vllm_llm.VLLMLLMConfig attribute)
LLMGenerateConfig (class in panda_guard.llms.base)
LMMJudge (class in panda_guard.role.judges.llm_based)
LMMJudgeConfig (class in panda_guard.role.judges.llm_based)
load_class() (in module panda_guard.utils)
load_csv() (panda_guard.role.attacks.scav.ScavAttacker method)
load_json_files_from_yaml() (in module panda_guard.cli.eval)
load_yaml() (in module panda_guard.cli.attack)
(in module panda_guard.cli.chat)
(in module panda_guard.cli.eval)
(in module panda_guard.cli.inference)
(in module panda_guard.cli.serve)
(in module panda_guard.utils)
log() (panda_guard.pipelines.inference.InferPipeline method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.core.GPTFuzzer method)
(panda_guard.role.attacks.pair.PairAttacker method)
(panda_guard.role.defenses.gradsafe.GradSafeDefender method)
logical_appeal_prompt() (in module panda_guard.role.attacks.pair)
logprob_threshold (panda_guard.role.attacks.random_search.RandomSearchAttackerConfig attribute)
logprobs (panda_guard.llms.base.LLMGenerateConfig attribute)
M
main() (in module panda_guard.cli.main)
mask_llm_url (panda_guard.role.attacks.art_prompt.ArtPromptAttackerConfig attribute)
mask_loc (panda_guard.role.attacks.overload.OverloadAttackerConfig attribute)
max_iterations (panda_guard.role.attacks.random_search.RandomSearchAttackerConfig attribute)
max_model_len (panda_guard.llms.vllm_llm.VLLMLLMConfig attribute)
max_n_to_change (panda_guard.role.attacks.random_search.RandomSearchAttackerConfig attribute)
max_n_tokens (panda_guard.llms.base.LLMGenerateConfig attribute)
max_restarts (panda_guard.role.attacks.random_search.RandomSearchAttackerConfig attribute)
max_tokens (panda_guard.cli.serve.ChatCompletionRequest attribute)
max_tokens_to_sample (panda_guard.llms.claude.ClaudeLLMConfig attribute)
MCTSExploreSelectPolicy (class in panda_guard.role.attacks.gptfuzzer_attack.fuzzer.selection)
mellowmax() (panda_guard.role.attacks.gcg.GCGAttacker method)
mellowmax_alpha (panda_guard.role.attacks.gcg.GCGAttackerConfig attribute)
message (panda_guard.cli.serve.Choice attribute)
messages (panda_guard.cli.serve.ChatCompletionRequest attribute)
model (panda_guard.cli.serve.ChatCompletionRequest attribute)
(panda_guard.cli.serve.ChatCompletionResponse attribute)
model_config (panda_guard.cli.serve.ChatCompletionRequest attribute)
(panda_guard.cli.serve.ChatCompletionResponse attribute)
(panda_guard.cli.serve.Choice attribute)
(panda_guard.cli.serve.ModelData attribute)
(panda_guard.cli.serve.ModelsResponse attribute)
model_name (panda_guard.llms.base.BaseLLMConfig attribute)
(panda_guard.llms.claude.ClaudeLLMConfig attribute)
(panda_guard.llms.gemini.GeminiLLMConfig attribute)
(panda_guard.llms.hf.HuggingFaceLLMConfig attribute)
(panda_guard.llms.oai.OpenAiChatLLMConfig attribute)
(panda_guard.llms.oai.OpenAiLLMConfig attribute)
(panda_guard.llms.vllm_llm.VLLMLLMConfig attribute)
ModelData (class in panda_guard.cli.serve)
ModelsResponse (class in panda_guard.cli.serve)
module
panda_guard
panda_guard.cli
panda_guard.cli.attack
panda_guard.cli.chat
panda_guard.cli.eval
panda_guard.cli.inference
panda_guard.cli.main
panda_guard.cli.serve
panda_guard.llms
panda_guard.llms.base
panda_guard.llms.claude
panda_guard.llms.gemini
panda_guard.llms.hf
panda_guard.llms.oai
panda_guard.llms.vllm_llm
panda_guard.pipelines
panda_guard.pipelines.inference
panda_guard.role
panda_guard.role.attacks
panda_guard.role.attacks.art_prompt
panda_guard.role.attacks.base
panda_guard.role.attacks.cold_attack.bleuloss
panda_guard.role.attacks.cold_attack.util
panda_guard.role.attacks.deepinception
panda_guard.role.attacks.gcg
panda_guard.role.attacks.gpt4_cipher
panda_guard.role.attacks.gptfuzzer_attack
panda_guard.role.attacks.gptfuzzer_attack.fuzzer
panda_guard.role.attacks.gptfuzzer_attack.fuzzer.core
panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator
panda_guard.role.attacks.gptfuzzer_attack.fuzzer.selection
panda_guard.role.attacks.gptfuzzer_attack.gptfuzz
panda_guard.role.attacks.gptfuzzer_attack.utils
panda_guard.role.attacks.gptfuzzer_attack.utils.predict
panda_guard.role.attacks.gptfuzzer_attack.utils.template
panda_guard.role.attacks.ica
panda_guard.role.attacks.overload
panda_guard.role.attacks.pair
panda_guard.role.attacks.random_search
panda_guard.role.attacks.renellm_attack
panda_guard.role.attacks.renellm_attack.renellm
panda_guard.role.attacks.rewrite
panda_guard.role.attacks.scav
panda_guard.role.attacks.tap
panda_guard.role.attacks.transfer
panda_guard.role.defenses
panda_guard.role.defenses.back_translate
panda_guard.role.defenses.base
panda_guard.role.defenses.goal_priority
panda_guard.role.defenses.gradsafe
panda_guard.role.defenses.icl
panda_guard.role.defenses.paraphrase
panda_guard.role.defenses.perplexity_filter
panda_guard.role.defenses.repe
panda_guard.role.defenses.repe_utils
panda_guard.role.defenses.repe_utils.pipelines
panda_guard.role.defenses.repe_utils.rep_control_pipeline
panda_guard.role.defenses.repe_utils.rep_control_reading_vec
panda_guard.role.defenses.repe_utils.rep_readers
panda_guard.role.defenses.repe_utils.rep_reading_pipeline
panda_guard.role.defenses.rewrite
panda_guard.role.defenses.rpo
panda_guard.role.defenses.self_defense
panda_guard.role.defenses.semantic_smoothllm
panda_guard.role.defenses.smoothllm
panda_guard.role.judges
panda_guard.role.judges.base
panda_guard.role.judges.judge_registry
panda_guard.role.judges.llm_based
panda_guard.role.judges.rule_based
panda_guard.utils
mutate_batch() (panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator.MutatePolicy method)
mutate_single() (panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator.MutatePolicy method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator.MutateRandomSinglePolicy method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator.Mutator method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator.OpenAIMutatorBase method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator.OpenAIMutatorCrossOver method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator.OpenAIMutatorExpand method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator.OpenAIMutatorGenerateSimilar method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator.OpenAIMutatorRephrase method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator.OpenAIMutatorShorten method)
MutatePolicy (class in panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator)
MutateRandomSinglePolicy (class in panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator)
Mutator (class in panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator)
N
n (panda_guard.cli.serve.ChatCompletionRequest attribute)
n_components (panda_guard.role.defenses.repe_utils.rep_readers.ClusterMeanRepReader attribute)
n_iterations (panda_guard.role.attacks.pair.PairAttackerConfig attribute)
n_replace (panda_guard.role.attacks.gcg.GCGAttackerConfig attribute)
needs_hiddens (panda_guard.role.defenses.repe_utils.rep_readers.ClusterMeanRepReader attribute)
(panda_guard.role.defenses.repe_utils.rep_readers.PCARepReader attribute)
NoneAttacker (class in panda_guard.role.attacks.transfer)
NoneAttackerConfig (class in panda_guard.role.attacks.transfer)
NoneDefender (class in panda_guard.role.defenses.rewrite)
NoneDefenderConfig (class in panda_guard.role.defenses.rewrite)
num_jailbreak (panda_guard.role.attacks.gptfuzzer_attack.fuzzer.core.PromptNode property)
num_perturbations (panda_guard.role.defenses.smoothllm.SmoothLLMDefenderConfig attribute)
num_query (panda_guard.role.attacks.gptfuzzer_attack.fuzzer.core.PromptNode property)
num_reject (panda_guard.role.attacks.gptfuzzer_attack.fuzzer.core.PromptNode property)
num_samples (panda_guard.role.defenses.semantic_smoothllm.SemanticSmoothLLMDefenderConfig attribute)
num_steps (panda_guard.role.attacks.gcg.GCGAttackerConfig attribute)
O
object (panda_guard.cli.serve.ChatCompletionResponse attribute)
(panda_guard.cli.serve.ModelData attribute)
(panda_guard.cli.serve.ModelsResponse attribute)
on_topic_score() (panda_guard.role.attacks.tap.TAPAttacker method)
one_hot() (in module panda_guard.role.attacks.cold_attack.util)
OpenAiChatLLM (class in panda_guard.llms.oai)
OpenAiChatLLMConfig (class in panda_guard.llms.oai)
OpenAiLLM (class in panda_guard.llms.oai)
OpenAiLLMConfig (class in panda_guard.llms.oai)
OpenAIMutatorBase (class in panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator)
OpenAIMutatorCrossOver (class in panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator)
OpenAIMutatorExpand (class in panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator)
OpenAIMutatorGenerateSimilar (class in panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator)
OpenAIMutatorRephrase (class in panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator)
OpenAIMutatorShorten (class in panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator)
optimzed_file_70b (panda_guard.role.attacks.scav.ScavAttackerConfig attribute)
optimzed_file_8b (panda_guard.role.attacks.scav.ScavAttackerConfig attribute)
overload_generate() (panda_guard.role.attacks.overload.OverloadAttacker method)
OverloadAttacker (class in panda_guard.role.attacks.overload)
OverloadAttackerConfig (class in panda_guard.role.attacks.overload)
override_config() (in module panda_guard.cli.eval)
owned_by (panda_guard.cli.serve.ModelData attribute)
P
pair_judge (panda_guard.role.attacks.pair.PairAttackerConfig attribute)
PairAttacker (class in panda_guard.role.attacks.pair)
PairAttackerConfig (class in panda_guard.role.attacks.pair)
PairLLMJudge (class in panda_guard.role.judges.llm_based)
PairLLMJudgeConfig (class in panda_guard.role.judges.llm_based)
panda_guard
module
panda_guard.cli
module
panda_guard.cli.attack
module
panda_guard.cli.chat
module
panda_guard.cli.eval
module
panda_guard.cli.inference
module
panda_guard.cli.main
module
panda_guard.cli.serve
module
panda_guard.llms
module
panda_guard.llms.base
module
panda_guard.llms.claude
module
panda_guard.llms.gemini
module
panda_guard.llms.hf
module
panda_guard.llms.oai
module
panda_guard.llms.vllm_llm
module
panda_guard.pipelines
module
panda_guard.pipelines.inference
module
panda_guard.role
module
panda_guard.role.attacks
module
panda_guard.role.attacks.art_prompt
module
panda_guard.role.attacks.base
module
panda_guard.role.attacks.cold_attack.bleuloss
module
panda_guard.role.attacks.cold_attack.util
module
panda_guard.role.attacks.deepinception
module
panda_guard.role.attacks.gcg
module
panda_guard.role.attacks.gpt4_cipher
module
panda_guard.role.attacks.gptfuzzer_attack
module
panda_guard.role.attacks.gptfuzzer_attack.fuzzer
module
panda_guard.role.attacks.gptfuzzer_attack.fuzzer.core
module
panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator
module
panda_guard.role.attacks.gptfuzzer_attack.fuzzer.selection
module
panda_guard.role.attacks.gptfuzzer_attack.gptfuzz
module
panda_guard.role.attacks.gptfuzzer_attack.utils
module
panda_guard.role.attacks.gptfuzzer_attack.utils.predict
module
panda_guard.role.attacks.gptfuzzer_attack.utils.template
module
panda_guard.role.attacks.ica
module
panda_guard.role.attacks.overload
module
panda_guard.role.attacks.pair
module
panda_guard.role.attacks.random_search
module
panda_guard.role.attacks.renellm_attack
module
panda_guard.role.attacks.renellm_attack.renellm
module
panda_guard.role.attacks.rewrite
module
panda_guard.role.attacks.scav
module
panda_guard.role.attacks.tap
module
panda_guard.role.attacks.transfer
module
panda_guard.role.defenses
module
panda_guard.role.defenses.back_translate
module
panda_guard.role.defenses.base
module
panda_guard.role.defenses.goal_priority
module
panda_guard.role.defenses.gradsafe
module
panda_guard.role.defenses.icl
module
panda_guard.role.defenses.paraphrase
module
panda_guard.role.defenses.perplexity_filter
module
panda_guard.role.defenses.repe
module
panda_guard.role.defenses.repe_utils
module
panda_guard.role.defenses.repe_utils.pipelines
module
panda_guard.role.defenses.repe_utils.rep_control_pipeline
module
panda_guard.role.defenses.repe_utils.rep_control_reading_vec
module
panda_guard.role.defenses.repe_utils.rep_readers
module
panda_guard.role.defenses.repe_utils.rep_reading_pipeline
module
panda_guard.role.defenses.rewrite
module
panda_guard.role.defenses.rpo
module
panda_guard.role.defenses.self_defense
module
panda_guard.role.defenses.semantic_smoothllm
module
panda_guard.role.defenses.smoothllm
module
panda_guard.role.judges
module
panda_guard.role.judges.base
module
panda_guard.role.judges.judge_registry
module
panda_guard.role.judges.llm_based
module
panda_guard.role.judges.rule_based
module
panda_guard.utils
module
parallel_judging() (panda_guard.pipelines.inference.InferPipeline method)
paraphrase_llm_config (panda_guard.role.defenses.paraphrase.ParaphraseDefenderConfig attribute)
paraphrase_llm_gen_config (panda_guard.role.defenses.paraphrase.ParaphraseDefenderConfig attribute)
paraphrase_prompt (panda_guard.role.defenses.paraphrase.ParaphraseDefenderConfig attribute)
ParaphraseDefender (class in panda_guard.role.defenses.paraphrase)
ParaphraseDefenderConfig (class in panda_guard.role.defenses.paraphrase)
parse() (panda_guard.role.attacks.art_prompt.ArtPromptAttacker method)
parse_configs_from_dict() (in module panda_guard.utils)
parse_nested_config() (in module panda_guard.utils)
PCARepReader (class in panda_guard.role.defenses.repe_utils.rep_readers)
PerplexityFilterDefender (class in panda_guard.role.defenses.perplexity_filter)
PerplexityFilterDefenderConfig (class in panda_guard.role.defenses.perplexity_filter)
perturb() (panda_guard.role.defenses.semantic_smoothllm.SemanticSmoothLLMDefender method)
perturb_with_llm() (panda_guard.role.defenses.semantic_smoothllm.SemanticSmoothLLMDefender method)
perturbation_llm_config (panda_guard.role.defenses.semantic_smoothllm.SemanticSmoothLLMDefenderConfig attribute)
perturbation_llm_gen_config (panda_guard.role.defenses.semantic_smoothllm.SemanticSmoothLLMDefenderConfig attribute)
perturbation_ratio (panda_guard.role.defenses.smoothllm.SmoothLLMDefenderConfig attribute)
perturbation_type (panda_guard.role.defenses.semantic_smoothllm.SemanticSmoothLLMDefenderConfig attribute)
(panda_guard.role.defenses.smoothllm.SmoothLLMDefenderConfig attribute)
post_process() (in module panda_guard.role.attacks.cold_attack.util)
post_sent() (in module panda_guard.role.attacks.cold_attack.util)
postprocess() (panda_guard.role.defenses.repe_utils.rep_reading_pipeline.RepReadingPipeline method)
pre_filter() (in module panda_guard.role.attacks.cold_attack.util)
predict() (panda_guard.role.attacks.gptfuzzer_attack.utils.predict.Predictor method)
(panda_guard.role.attacks.gptfuzzer_attack.utils.predict.RoBERTaPredictor method)
predict_model (panda_guard.role.attacks.gptfuzzer_attack.gptfuzz.GPTFuzzAttackerConfig attribute)
Predictor (class in panda_guard.role.attacks.gptfuzzer_attack.utils.predict)
preprocess() (panda_guard.role.defenses.repe_utils.rep_reading_pipeline.RepReadingPipeline method)
preprocess_dataset() (panda_guard.role.defenses.repe.RepeDefender method)
presence_penalty (panda_guard.cli.serve.ChatCompletionRequest attribute)
print_conv() (in module panda_guard.role.attacks.pair)
print_topk_stats() (in module panda_guard.role.attacks.cold_attack.util)
process_end_eos() (in module panda_guard.utils)
process_file() (in module panda_guard.cli.eval)
process_target_response() (panda_guard.role.attacks.tap.TAPAttacker static method)
project_onto_direction() (in module panda_guard.role.defenses.repe_utils.rep_readers)
prompt_template (panda_guard.role.defenses.repe.RepeDefenderConfig attribute)
(panda_guard.role.defenses.rewrite.RewriteDefenderConfig attribute)
(panda_guard.role.defenses.rewrite.SelfReminderDefenderConfig attribute)
PromptNode (class in panda_guard.role.attacks.gptfuzzer_attack.fuzzer.core)
prune() (panda_guard.role.attacks.tap.TAPAttacker method)
Q
quantization (panda_guard.llms.vllm_llm.VLLMLLMConfig attribute)
R
random_dict (panda_guard.role.attacks.overload.OverloadAttackerConfig attribute)
random_modify_tokens() (panda_guard.role.attacks.random_search.RandomSearchAttacker method)
RandomRepReader (class in panda_guard.role.defenses.repe_utils.rep_readers)
RandomSearchAttacker (class in panda_guard.role.attacks.random_search)
RandomSearchAttackerConfig (class in panda_guard.role.attacks.random_search)
RandomSelectPolicy (class in panda_guard.role.attacks.gptfuzzer_attack.fuzzer.selection)
rank_and_filter() (in module panda_guard.role.attacks.cold_attack.util)
rank_generations() (in module panda_guard.role.attacks.cold_attack.util)
recenter() (in module panda_guard.role.defenses.repe_utils.rep_readers)
register_judge() (in module panda_guard.role.judges.judge_registry)
ReNeLLMAttacker (class in panda_guard.role.attacks.renellm_attack.renellm)
ReNeLLMAttackerConfig (class in panda_guard.role.attacks.renellm_attack.renellm)
rep_token (panda_guard.role.defenses.repe.RepeDefenderConfig attribute)
RepControlPipeline (class in panda_guard.role.defenses.repe_utils.rep_control_pipeline)
repe_pipeline_registry() (in module panda_guard.role.defenses.repe_utils.pipelines)
RepeDefender (class in panda_guard.role.defenses.repe)
RepeDefenderConfig (class in panda_guard.role.defenses.repe)
rephrase() (panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator.OpenAIMutatorRephrase method)
RepReader (class in panda_guard.role.defenses.repe_utils.rep_readers)
RepReadingPipeline (class in panda_guard.role.defenses.repe_utils.rep_reading_pipeline)
reset() (panda_guard.llms.base.BaseLLM method)
(panda_guard.pipelines.inference.InferPipeline method)
(panda_guard.role.defenses.repe_utils.rep_control_reading_vec.WrappedBlock method)
(panda_guard.role.defenses.repe_utils.rep_control_reading_vec.WrappedReadingVecModel method)
response() (panda_guard.role.defenses.gradsafe.GradSafeDefender method)
(panda_guard.role.defenses.self_defense.SelfDefenseDefender method)
response_rules (panda_guard.role.attacks.random_search.RandomSearchAttackerConfig attribute)
response_rules() (in module panda_guard.role.attacks.random_search)
return_new_response_anyway (panda_guard.role.defenses.back_translate.BackTranslationDefenderConfig attribute)
rewrite() (panda_guard.role.attacks.rewrite.RewriteAttacker method)
rewrite_llm_config (panda_guard.role.attacks.renellm_attack.renellm.ReNeLLMAttackerConfig attribute)
rewrite_llm_gen_config (panda_guard.role.attacks.renellm_attack.renellm.ReNeLLMAttackerConfig attribute)
rewrite_template (panda_guard.role.attacks.art_prompt.ArtPromptAttackerConfig attribute)
(panda_guard.role.attacks.gpt4_cipher.GPT4CipherAttackerConfig attribute)
(panda_guard.role.attacks.rewrite.RewriteAttackerConfig attribute)
RewriteAttacker (class in panda_guard.role.attacks.rewrite)
RewriteAttackerConfig (class in panda_guard.role.attacks.rewrite)
RewriteDefender (class in panda_guard.role.defenses.rewrite)
RewriteDefenderConfig (class in panda_guard.role.defenses.rewrite)
RoBERTaPredictor (class in panda_guard.role.attacks.gptfuzzer_attack.utils.predict)
roleplaying_prompt() (in module panda_guard.role.attacks.pair)
RoundRobinSelectPolicy (class in panda_guard.role.attacks.gptfuzzer_attack.fuzzer.selection)
RPODefender (class in panda_guard.role.defenses.rpo)
RPODefenderConfig (class in panda_guard.role.defenses.rpo)
rule_based_judge() (in module panda_guard.role.attacks.random_search)
RuleBasedJudge (class in panda_guard.role.judges.rule_based)
RuleBasedJudgeConfig (class in panda_guard.role.judges.rule_based)
run() (panda_guard.role.attacks.gptfuzzer_attack.fuzzer.core.GPTFuzzer method)
run_inference() (in module panda_guard.cli.eval)
run_prompt() (panda_guard.role.defenses.repe_utils.rep_control_reading_vec.WrappedReadingVecModel method)
S
safe_set (panda_guard.role.defenses.gradsafe.GradSafeDefenderConfig attribute)
safety_settings (panda_guard.llms.gemini.GeminiLLMConfig attribute)
sample_ids_from_grad() (panda_guard.role.attacks.gcg.GCGAttacker method)
ScavAttacker (class in panda_guard.role.attacks.scav)
ScavAttackerConfig (class in panda_guard.role.attacks.scav)
scence (panda_guard.role.attacks.deepinception.DeepInceptionAttackerConfig attribute)
schedule_n_to_change_fixed() (in module panda_guard.role.attacks.random_search)
score_by_bert() (in module panda_guard.role.attacks.cold_attack.util)
search_width (panda_guard.role.attacks.gcg.GCGAttackerConfig attribute)
seed (panda_guard.llms.base.LLMGenerateConfig attribute)
(panda_guard.role.attacks.gcg.GCGAttackerConfig attribute)
select() (panda_guard.role.attacks.gptfuzzer_attack.fuzzer.selection.EXP3SelectPolicy method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.selection.MCTSExploreSelectPolicy method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.selection.RandomSelectPolicy method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.selection.RoundRobinSelectPolicy method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.selection.SelectPolicy method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.selection.UCBSelectPolicy method)
selector (panda_guard.role.defenses.repe.RepeDefenderConfig attribute)
SelectPolicy (class in panda_guard.role.attacks.gptfuzzer_attack.fuzzer.selection)
SelfDefenseDefender (class in panda_guard.role.defenses.self_defense)
SelfDefenseDefenderConfig (class in panda_guard.role.defenses.self_defense)
SelfReminderDefender (class in panda_guard.role.defenses.rewrite)
SelfReminderDefenderConfig (class in panda_guard.role.defenses.rewrite)
SemanticSmoothLLMDefender (class in panda_guard.role.defenses.semantic_smoothllm)
SemanticSmoothLLMDefenderConfig (class in panda_guard.role.defenses.semantic_smoothllm)
sentence_completion() (in module panda_guard.role.attacks.cold_attack.util)
set_activations() (panda_guard.role.defenses.repe.RepeDefender method)
set_controller() (panda_guard.role.defenses.repe_utils.rep_control_reading_vec.WrappedBlock method)
(panda_guard.role.defenses.repe_utils.rep_control_reading_vec.WrappedReadingVecModel method)
set_masks() (panda_guard.role.defenses.repe_utils.rep_control_reading_vec.WrappedBlock method)
(panda_guard.role.defenses.repe_utils.rep_control_reading_vec.WrappedReadingVecModel method)
setup() (panda_guard.role.attacks.gptfuzzer_attack.fuzzer.core.GPTFuzzer method)
shorten() (panda_guard.role.attacks.gptfuzzer_attack.fuzzer.mutator.OpenAIMutatorShorten method)
should_reduce_batch_size() (panda_guard.role.attacks.gcg.GCGAttacker method)
sim_score() (in module panda_guard.role.attacks.cold_attack.util)
SmoothLLMDefender (class in panda_guard.role.defenses.smoothllm)
SmoothLLMDefenderConfig (class in panda_guard.role.defenses.smoothllm)
soft_backward() (in module panda_guard.role.attacks.cold_attack.util)
soft_backward_loss() (in module panda_guard.role.attacks.cold_attack.util)
soft_backward_steps() (in module panda_guard.role.attacks.cold_attack.util)
soft_distance() (in module panda_guard.role.attacks.cold_attack.util)
soft_forward() (in module panda_guard.role.attacks.cold_attack.util)
soft_forward_loss() (in module panda_guard.role.attacks.cold_attack.util)
soft_forward_xyz() (in module panda_guard.role.attacks.cold_attack.util)
soft_forward_xyz_target() (in module panda_guard.role.attacks.cold_attack.util)
soft_nll() (in module panda_guard.role.attacks.cold_attack.util)
soft_nll_detach() (in module panda_guard.role.attacks.cold_attack.util)
start() (in module panda_guard.cli.attack)
(in module panda_guard.cli.chat)
(in module panda_guard.cli.eval)
(in module panda_guard.cli.inference)
(in module panda_guard.cli.serve)
stream (panda_guard.cli.serve.ChatCompletionRequest attribute)
(panda_guard.llms.base.LLMGenerateConfig attribute)
strlen (panda_guard.role.attacks.overload.OverloadAttackerConfig attribute)
synthesis_message() (in module panda_guard.role.attacks.gptfuzzer_attack.utils.template)
system_template (panda_guard.role.defenses.repe.RepeDefenderConfig attribute)
(panda_guard.role.defenses.rewrite.RewriteDefenderConfig attribute)
(panda_guard.role.defenses.rewrite.SelfReminderDefenderConfig attribute)
(panda_guard.role.judges.llm_based.LMMJudgeConfig attribute)
(panda_guard.role.judges.llm_based.PairLLMJudgeConfig attribute)
system_template_score (panda_guard.role.judges.llm_based.TAPLLMJudgeConfig attribute)
system_template_topic (panda_guard.role.judges.llm_based.TAPLLMJudgeConfig attribute)
T
tap_judge_config (panda_guard.role.attacks.tap.TAPAttackerConfig attribute)
TAPAttacker (class in panda_guard.role.attacks.tap)
TAPAttackerConfig (class in panda_guard.role.attacks.tap)
TAPLLMJudge (class in panda_guard.role.judges.llm_based)
TAPLLMJudgeConfig (class in panda_guard.role.judges.llm_based)
target_llm_config (panda_guard.role.attacks.gptfuzzer_attack.gptfuzz.GPTFuzzAttackerConfig attribute)
(panda_guard.role.attacks.pair.PairAttackerConfig attribute)
(panda_guard.role.attacks.random_search.RandomSearchAttackerConfig attribute)
(panda_guard.role.attacks.renellm_attack.renellm.ReNeLLMAttackerConfig attribute)
(panda_guard.role.attacks.tap.TAPAttackerConfig attribute)
(panda_guard.role.defenses.base.BaseDefenderConfig attribute)
(panda_guard.role.defenses.goal_priority.GoalPriorityDefenderConfig attribute)
(panda_guard.role.defenses.gradsafe.GradSafeDefenderConfig attribute)
(panda_guard.role.defenses.rpo.RPODefenderConfig attribute)
(panda_guard.role.defenses.self_defense.SelfDefenseDefenderConfig attribute)
target_llm_gen_config (panda_guard.role.attacks.gptfuzzer_attack.gptfuzz.GPTFuzzAttackerConfig attribute)
(panda_guard.role.attacks.pair.PairAttackerConfig attribute)
(panda_guard.role.attacks.random_search.RandomSearchAttackerConfig attribute)
(panda_guard.role.attacks.renellm_attack.renellm.ReNeLLMAttackerConfig attribute)
(panda_guard.role.attacks.tap.TAPAttackerConfig attribute)
(panda_guard.role.defenses.base.BaseDefenderConfig attribute)
(panda_guard.role.defenses.goal_priority.GoalPriorityDefenderConfig attribute)
(panda_guard.role.defenses.gradsafe.GradSafeDefenderConfig attribute)
(panda_guard.role.defenses.rpo.RPODefenderConfig attribute)
(panda_guard.role.defenses.self_defense.SelfDefenseDefenderConfig attribute)
target_llm_name (panda_guard.role.attacks.scav.ScavAttackerConfig attribute)
target_llm_response() (panda_guard.role.attacks.tap.TAPAttacker method)
target_str (panda_guard.role.attacks.pair.PairAttackerConfig attribute)
(panda_guard.role.attacks.random_search.RandomSearchAttackerConfig attribute)
(panda_guard.role.attacks.tap.TAPAttackerConfig attribute)
temperature (panda_guard.cli.serve.ChatCompletionRequest attribute)
(panda_guard.llms.base.LLMGenerateConfig attribute)
tensor_parallel_size (panda_guard.llms.vllm_llm.VLLMLLMConfig attribute)
threshold (panda_guard.role.defenses.back_translate.BackTranslationDefenderConfig attribute)
(panda_guard.role.defenses.perplexity_filter.PerplexityFilterDefenderConfig attribute)
top_k_filter() (in module panda_guard.role.attacks.cold_attack.util)
top_k_filter_3d() (in module panda_guard.role.attacks.cold_attack.util)
top_p (panda_guard.cli.serve.ChatCompletionRequest attribute)
top_p() (in module panda_guard.role.attacks.cold_attack.util)
topk (panda_guard.role.attacks.gcg.GCGAttackerConfig attribute)
(panda_guard.role.defenses.repe.RepeDefenderConfig attribute)
total_tokens (panda_guard.llms.base.BaseLLM property)
TransferAttacker (class in panda_guard.role.attacks.transfer)
TransferAttackerConfig (class in panda_guard.role.attacks.transfer)
transform() (panda_guard.role.defenses.repe_utils.rep_readers.RepReader method)
trust_remote_code (panda_guard.llms.vllm_llm.VLLMLLMConfig attribute)
U
UCBSelectPolicy (class in panda_guard.role.attacks.gptfuzzer_attack.fuzzer.selection)
unsafe_set (panda_guard.role.defenses.gradsafe.GradSafeDefenderConfig attribute)
unsafe_threshold (panda_guard.role.defenses.gradsafe.GradSafeDefenderConfig attribute)
unwrap() (panda_guard.role.defenses.repe_utils.rep_control_reading_vec.WrappedReadingVecModel method)
update() (panda_guard.llms.base.BaseLLM method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.core.GPTFuzzer method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.selection.EXP3SelectPolicy method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.selection.MCTSExploreSelectPolicy method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.selection.RoundRobinSelectPolicy method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.selection.SelectPolicy method)
(panda_guard.role.attacks.gptfuzzer_attack.fuzzer.selection.UCBSelectPolicy method)
usage (panda_guard.cli.serve.ChatCompletionResponse attribute)
use_mellowmax (panda_guard.role.attacks.gcg.GCGAttackerConfig attribute)
use_prefix_cache (panda_guard.role.attacks.gcg.GCGAttackerConfig attribute)
user (panda_guard.cli.serve.ChatCompletionRequest attribute)
user_init_msg (panda_guard.role.attacks.pair.PairAttackerConfig attribute)
user_msg_temp (panda_guard.role.attacks.pair.PairAttackerConfig attribute)
user_template (panda_guard.role.judges.llm_based.LMMJudgeConfig attribute)
(panda_guard.role.judges.llm_based.PairLLMJudgeConfig attribute)
user_template_score (panda_guard.role.judges.llm_based.TAPLLMJudgeConfig attribute)
user_template_topic (panda_guard.role.judges.llm_based.TAPLLMJudgeConfig attribute)
V
value_len (panda_guard.role.attacks.overload.OverloadAttackerConfig attribute)
verbose (panda_guard.role.attacks.pair.PairAttackerConfig attribute)
(panda_guard.role.attacks.random_search.RandomSearchAttackerConfig attribute)
(panda_guard.role.defenses.gradsafe.GradSafeDefenderConfig attribute)
version_callback() (in module panda_guard.cli.main)
VLLMLLM (class in panda_guard.llms.vllm_llm)
VLLMLLMConfig (class in panda_guard.llms.vllm_llm)
vocab_prune() (in module panda_guard.role.attacks.cold_attack.util)
W
wait_for_gpu_memory() (in module panda_guard.utils)
width (panda_guard.role.attacks.tap.TAPAttackerConfig attribute)
wrap() (panda_guard.role.defenses.repe_utils.rep_control_reading_vec.WrappedReadingVecModel method)
wrap_all() (panda_guard.role.defenses.repe_utils.rep_control_reading_vec.WrappedReadingVecModel method)
wrap_block() (panda_guard.role.defenses.repe_utils.rep_control_reading_vec.WrappedReadingVecModel method)
wrap_decoder_block() (panda_guard.role.defenses.repe_utils.rep_control_reading_vec.WrappedReadingVecModel method)
WrappedBlock (class in panda_guard.role.defenses.repe_utils.rep_control_reading_vec)
WrappedReadingVecModel (class in panda_guard.role.defenses.repe_utils.rep_control_reading_vec)
write_json_lines() (in module panda_guard.role.attacks.cold_attack.util)