
Commit 5c05fba

Add alignment vLLM metrics and opposite-mode runs
1 parent 4f5c1de commit 5c05fba

14 files changed

Lines changed: 1627 additions & 55 deletions

.agents/logbooks/alignment_function.md

Lines changed: 611 additions & 0 deletions
Large diffs are not rendered by default.
experiments/align_debug_vllm_70b_mixtral_rejected_opposite.py

Lines changed: 109 additions & 0 deletions
@@ -0,0 +1,109 @@
# Copyright The Marin Authors
# SPDX-License-Identifier: Apache-2.0

"""
Debug heterogeneous alignment pipeline with rejected-only opposite prompting.

Chosen / infrastructure roles use Llama 3.3 70B Instruct.
Rejected responses use Mixtral 8x7B Instruct with rejected_prompt_strategy=opposite.

This is the F2 heterogeneous local-local `auto` validation with opposite-mode
rejected responses. The expected response-orchestration shape is:

- separate `chosen` and `rejected` child jobs
- no forced dependency between them
- rejected prompt construction uses the explicit opposite-mode system prompt

Submit to Iris:

uv run iris --config lib/iris/examples/marin.yaml job run \
    --no-wait \
    --job-name align-debug-vllm-70b-mixtral-rejected-opposite-auto \
    --cpu 4 \
    --memory 16GB \
    --disk 10GB \
    --region us-central1 \
    -- python experiments/align_debug_vllm_70b_mixtral_rejected_opposite.py
"""

from pathlib import Path

from experiments.llama import llama_70b
from experiments.models import llama_3_3_70b_instruct
from marin.alignment.align import AlignConfig, align
from marin.alignment.generate_responses import RejectedPromptStrategy
from marin.alignment.inference_config import VLLMConfig
from marin.execution.executor import executor_main

SPEC_PATH = str(Path(__file__).parent / "posttrain" / "specs" / "openai_model_spec.jsonl")
LLAMA_70B_GCS_PATH = "gs://marin-us-central1/models/meta-llama--Llama-3-3-70B-Instruct--6f6073b"
MIXTRAL_8X7B_INSTRUCT_GCS_PATH = "gs://marin-us-central1/models/mistralai--Mixtral-8x7B-Instruct-v0-1--eba9230"

llama_vllm = VLLMConfig(
    model=LLAMA_70B_GCS_PATH,
    tensor_parallel_size=4,
    max_model_len=4096,
    gpu_memory_utilization=0.9,
    tpu_type="v5p-8",
    disk="10g",
    ram="256g",
)

mixtral_vllm = VLLMConfig(
    model=MIXTRAL_8X7B_INSTRUCT_GCS_PATH,
    tensor_parallel_size=4,
    max_model_len=4096,
    gpu_memory_utilization=0.9,
    tpu_type="v5p-8",
    disk="10g",
    ram="256g",
)

align_config = AlignConfig(
    ideation_model=llama_vllm,
    extract_model=llama_vllm,
    judge_model=llama_vllm,
    covering_strength=2,
    covering_seed=42,
    ideation_workers=1,
    concretize_workers=1,
    extract_workers=1,
    prompt_batch_size=4,
    understanding_max_tokens=1024,
    understanding_temperature=1.0,
    concretize_max_tokens=1536,
    concretize_temperature=1.0,
    concretize_max_attempts=5,
    extract_max_tokens=1024,
    judge_workers=1,
    judge_batch_size=4,
    teacher_n=1,
    teacher_temperature=0.7,
    teacher_max_tokens=512,
    rejected_n=1,
    rejected_temperature=0.7,
    rejected_max_tokens=512,
    rejected_prompt_strategy=RejectedPromptStrategy.OPPOSITE,
    judge_min_chosen_score=1.0,
    judge_min_gap=0.0,
    tokenizer="meta-llama/Llama-3.3-70B-Instruct",
    statement_ids=["ask_clarifying_questions"],
)

dataset_steps = align(
    name="debug_vllm_70b_mixtral_rejected_opposite_auto_smoke",
    pretrained_model=llama_3_3_70b_instruct,
    spec=SPEC_PATH,
    model_config=llama_70b,
    teacher_model=llama_vllm,
    align_config=align_config,
    dpo_config=None,
    rejected_model=mixtral_vllm,
    tags=["debug", "vllm", "70b", "mixtral-rejected", "opposite-mode"],
)

if __name__ == "__main__":
    executor_main(
        steps=dataset_steps,
        description="Debug heterogeneous auto alignment with Mixtral rejected opposite-mode responses",
    )
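
The docstring above pins down the orchestration contract but not the prompt construction itself. As a rough illustration of what opposite-mode rejected prompting might look like, here is a minimal sketch; the helper name build_opposite_messages and the system-prompt wording are assumptions for illustration, not the actual marin.alignment implementation:

# Hypothetical sketch of opposite-mode message construction. The real
# logic lives in marin.alignment.generate_responses; this wording is
# illustrative only.
def build_opposite_messages(prompt: str, behavior_statement: str) -> list[dict[str, str]]:
    # Explicit system prompt instructing the model to act against the
    # behavior statement, so the "rejected" side is deliberately bad.
    system = (
        "You are generating a deliberately non-compliant response. "
        f"Act contrary to the following behavior statement: {behavior_statement}"
    )
    return [
        {"role": "system", "content": system},
        {"role": "user", "content": prompt},
    ]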
experiments/align_debug_vllm_70b_mixtral_rejected_opposite_metrics.py

Lines changed: 104 additions & 0 deletions

@@ -0,0 +1,104 @@
# Copyright The Marin Authors
# SPDX-License-Identifier: Apache-2.0

"""
Debug heterogeneous alignment pipeline with rejected-only opposite prompting.

This is a fresh metrics-focused one-statement end-to-end rerun of the validated
opposite-mode smoke so we can materialize standardized `vllm_metrics.json`
artifacts without reusing the earlier cached outputs.

Submit to Iris:

uv run iris --config lib/iris/examples/marin.yaml job run \
    --no-wait \
    --job-name align-debug-vllm-70b-mixtral-rejected-opposite-auto-metrics-fresh \
    --cpu 4 \
    --memory 16GB \
    --disk 10GB \
    --region us-central1 \
    -- python experiments/align_debug_vllm_70b_mixtral_rejected_opposite_metrics.py
"""

from pathlib import Path

from experiments.llama import llama_70b
from experiments.models import llama_3_3_70b_instruct
from marin.alignment.align import AlignConfig, align
from marin.alignment.generate_responses import RejectedPromptStrategy
from marin.alignment.inference_config import VLLMConfig
from marin.execution.executor import executor_main

SPEC_PATH = str(Path(__file__).parent / "posttrain" / "specs" / "openai_model_spec.jsonl")
LLAMA_70B_GCS_PATH = "gs://marin-us-central1/models/meta-llama--Llama-3-3-70B-Instruct--6f6073b"
MIXTRAL_8X7B_INSTRUCT_GCS_PATH = "gs://marin-us-central1/models/mistralai--Mixtral-8x7B-Instruct-v0-1--eba9230"
DESCRIPTION = "Debug heterogeneous auto alignment with opposite-mode rejected responses and standardized vLLM metrics"

llama_vllm = VLLMConfig(
    model=LLAMA_70B_GCS_PATH,
    tensor_parallel_size=4,
    max_model_len=4096,
    gpu_memory_utilization=0.9,
    tpu_type="v5p-8",
    disk="10g",
    ram="256g",
)

mixtral_vllm = VLLMConfig(
    model=MIXTRAL_8X7B_INSTRUCT_GCS_PATH,
    tensor_parallel_size=4,
    max_model_len=4096,
    gpu_memory_utilization=0.9,
    tpu_type="v5p-8",
    disk="10g",
    ram="256g",
)

align_config = AlignConfig(
    ideation_model=llama_vllm,
    extract_model=llama_vllm,
    judge_model=llama_vllm,
    covering_strength=2,
    covering_seed=42,
    ideation_workers=1,
    concretize_workers=1,
    extract_workers=1,
    prompt_batch_size=4,
    understanding_max_tokens=1024,
    understanding_temperature=1.0,
    concretize_max_tokens=1536,
    concretize_temperature=1.0,
    concretize_max_attempts=5,
    extract_max_tokens=1024,
    judge_workers=1,
    judge_batch_size=4,
    teacher_n=1,
    teacher_temperature=0.7,
    teacher_max_tokens=512,
    rejected_n=1,
    rejected_temperature=0.7,
    rejected_max_tokens=512,
    rejected_prompt_strategy=RejectedPromptStrategy.OPPOSITE,
    judge_min_chosen_score=1.0,
    judge_min_gap=0.0,
    tokenizer="meta-llama/Llama-3.3-70B-Instruct",
    statement_ids=["ask_clarifying_questions"],
)

dataset_steps = align(
    name="debug_vllm_70b_mixtral_rejected_opposite_auto_smoke_metrics",
    pretrained_model=llama_3_3_70b_instruct,
    spec=SPEC_PATH,
    model_config=llama_70b,
    teacher_model=llama_vllm,
    align_config=align_config,
    dpo_config=None,
    rejected_model=mixtral_vllm,
    tags=["debug", "vllm", "70b", "mixtral-rejected", "opposite-mode", "metrics"],
)

if __name__ == "__main__":
    executor_main(
        steps=dataset_steps,
        description=DESCRIPTION,
    )
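
Once this rerun completes, each generation step should leave a standardized vllm_metrics.json alongside its outputs. The commit does not show the artifact schema, so the sketch below only lists and prints whatever is there; OUTPUT_PREFIX is a placeholder to point at the step's actual output path:

# Sketch: enumerate and load vllm_metrics.json artifacts from GCS.
# The prefix and the artifact's field names are assumptions; check the
# real output path and schema once the job finishes.
import json

import fsspec

OUTPUT_PREFIX = "gs://marin-us-central1/align"  # placeholder; adjust to the step's output path

fs = fsspec.filesystem("gs")
for path in fs.glob(f"{OUTPUT_PREFIX}/**/vllm_metrics.json"):
    with fs.open(path) as f:
        metrics = json.load(f)  # schema not shown in this commit
    print(path, metrics)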
experiments/generate_rejected_opposite_llama_3_3_70b_existing_prompts.py

Lines changed: 84 additions & 0 deletions

@@ -0,0 +1,84 @@
# Copyright The Marin Authors
# SPDX-License-Identifier: Apache-2.0

"""
Run standalone rejected-side opposite-mode response generation on a known-good prompts artifact.

This validates the new fail-closed rejected-only `opposite` prompt strategy
without involving the full alignment pipeline. The run uses the staged
`us-central1` Llama 3.3 70B checkpoint and an existing prompt artifact that was
generated successfully from the OpenAI model-spec smoke statement.

Submit to Iris:

uv run iris --config lib/iris/examples/marin.yaml job run \
    --no-wait \
    --job-name generate-rejected-opposite-llama-3-3-70b-existing-prompts \
    --cpu 4 \
    --memory 16GB \
    --disk 10GB \
    --region us-central1 \
    -- python experiments/generate_rejected_opposite_llama_3_3_70b_existing_prompts.py
"""

from __future__ import annotations

from pathlib import Path

from experiments.models import llama_3_3_70b_instruct
from marin.alignment.generate_responses import (
    RejectedPromptStrategy,
    ResponseGenConfig,
    ResponseRole,
    generate_responses,
)
from marin.alignment.inference_config import VLLMConfig
from marin.execution.executor import ExecutorStep, executor_main, output_path_of, this_output_path
from marin.execution.remote import remote

PROMPTS_PATH = "gs://marin-us-central1/align/debug_generate_prompts_llama_3_3_70b_refactored/prompts-f29568"
SPEC_PATH = str(Path(__file__).parent / "posttrain" / "specs" / "openai_model_spec.jsonl")
MODEL_STEP = llama_3_3_70b_instruct
DESCRIPTION = (
    "Standalone rejected-only opposite-mode generation on existing prompts with staged us-central1 Llama 3.3 70B"
)


llama_3_3_70b_vllm = VLLMConfig(
    model=output_path_of(MODEL_STEP),
    tensor_parallel_size=4,
    max_model_len=4096,
    gpu_memory_utilization=0.9,
    tpu_type="v5p-8",
    disk="5g",
    ram="256g",
)

response_step = ExecutorStep(
    name="align/debug_generate_rejected_opposite_llama_3_3_70b_existing_prompts/responses",
    description="Generate rejected-only opposite-mode responses on a known-good prompts artifact",
    fn=remote(
        generate_responses,
        resources=llama_3_3_70b_vllm.resources,
        env_vars={"MARIN_VLLM_MODE": "native"},
        pip_dependency_groups=["vllm", "tpu"],
    ),
    config=ResponseGenConfig(
        prompts_path=PROMPTS_PATH,
        output_path=this_output_path(),
        model_config=llama_3_3_70b_vllm,
        role=ResponseRole.REJECTED,
        rejected_prompt_strategy=RejectedPromptStrategy.OPPOSITE,
        n=1,
        temperature=0.7,
        max_tokens=512,
        behavior_statements_path=SPEC_PATH,
    ),
)


if __name__ == "__main__":
    executor_main(
        steps=[response_step],
        description=DESCRIPTION,
    )
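
"Fail-closed" here means the opposite strategy should refuse to run rather than silently degrade to unguided generation when the behavior statements it needs are missing, which is why this script passes behavior_statements_path=SPEC_PATH explicitly. A minimal sketch of such a guard, assuming a check shaped roughly like this (the function name and error message are illustrative, not the actual generate_responses code):

# Illustrative fail-closed precondition check; names and message are
# assumptions, not the marin.alignment.generate_responses implementation.
from marin.alignment.generate_responses import RejectedPromptStrategy


def check_opposite_preconditions(
    strategy: RejectedPromptStrategy,
    behavior_statements_path: str | None,
) -> None:
    # Error out instead of falling back to unguided generation.
    if strategy == RejectedPromptStrategy.OPPOSITE and behavior_statements_path is None:
        raise ValueError(
            "rejected_prompt_strategy=OPPOSITE requires behavior_statements_path; "
            "refusing to fall back to unguided generation"
        )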

experiments/generate_responses_llama_3_3_70b_existing_prompts.py

Lines changed: 8 additions & 2 deletions
@@ -23,7 +23,12 @@
 from __future__ import annotations

 from experiments.models import llama_3_3_70b_instruct
-from marin.alignment.generate_responses import ResponseGenConfig, generate_responses
+from marin.alignment.generate_responses import (
+    RejectedPromptStrategy,
+    ResponseGenConfig,
+    ResponseRole,
+    generate_responses,
+)
 from marin.alignment.inference_config import VLLMConfig
 from marin.execution.executor import ExecutorStep, executor_main, output_path_of, this_output_path
 from marin.execution.remote import remote
@@ -54,10 +59,11 @@
         prompts_path=PROMPTS_PATH,
         output_path=this_output_path(),
         model_config=llama_3_3_70b_vllm,
+        role=ResponseRole.REJECTED,
+        rejected_prompt_strategy=RejectedPromptStrategy.UNGUIDED,
         n=1,
         temperature=0.7,
         max_tokens=512,
-        behavior_statements_path=None,
     ),
 )

experiments/generate_responses_llama_3_3_70b_existing_prompts_refactored.py

Lines changed: 8 additions & 2 deletions
@@ -22,7 +22,12 @@
 from __future__ import annotations

 from experiments.models import llama_3_3_70b_instruct
-from marin.alignment.generate_responses import ResponseGenConfig, generate_responses
+from marin.alignment.generate_responses import (
+    RejectedPromptStrategy,
+    ResponseGenConfig,
+    ResponseRole,
+    generate_responses,
+)
 from marin.alignment.inference_config import VLLMConfig
 from marin.execution.executor import ExecutorStep, executor_main, output_path_of, this_output_path
 from marin.execution.remote import remote
@@ -60,10 +65,11 @@
         prompts_path=PROMPTS_PATH,
         output_path=this_output_path(),
         model_config=llama_3_3_70b_vllm,
+        role=ResponseRole.REJECTED,
+        rejected_prompt_strategy=RejectedPromptStrategy.UNGUIDED,
         n=1,
         temperature=0.7,
         max_tokens=512,
-        behavior_statements_path=None,
     ),
 )

experiments/generate_responses_llama_3_3_70b_existing_prompts_vllm_serve.py

Lines changed: 14 additions & 3 deletions
@@ -38,7 +38,12 @@

 from experiments.models import llama_3_3_70b_instruct
 from marin.alignment.generate_prompts import load_sharded_jsonl_gz, write_sharded_jsonl_gz
-from marin.alignment.generate_responses import _build_messages, _make_response_record
+from marin.alignment.generate_responses import (
+    RejectedPromptStrategy,
+    ResponseRole,
+    _build_rejected_messages,
+    _make_response_record,
+)
 from marin.alignment.inference_config import VLLMConfig
 from marin.evaluation.evaluators.evaluator import ModelConfig
 from marin.execution.executor import ExecutorStep, executor_main, output_path_of, this_output_path
@@ -91,7 +96,7 @@ def _request_one(
     max_tokens: int,
     n: int,
 ) -> dict[str, Any]:
-    messages = _build_messages(prompt, behavior_statements=None)
+    messages = _build_rejected_messages(prompt, RejectedPromptStrategy.UNGUIDED, None)
     response = requests.post(
         f"{server_url}/chat/completions",
         json={
@@ -108,7 +113,13 @@
     responses = [
         {"content": choice["message"]["content"] or "", "index": idx} for idx, choice in enumerate(payload["choices"])
     ]
-    return _make_response_record(prompt, model_path, responses)
+    return _make_response_record(
+        prompt,
+        model_path,
+        responses,
+        role=ResponseRole.REJECTED,
+        rejected_prompt_strategy=RejectedPromptStrategy.UNGUIDED,
+    )


 def generate_responses_via_vllm_serve(config: VllmServeResponseGenConfig) -> None:
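
This retrofit routes the vllm-serve HTTP path through the same rejected-message builder as the native path and stamps each response record with its role and prompt strategy, so both paths stay consistent. A quick local smoke check of the builder; the expected output shape (a single user message and no system prompt for UNGUIDED) is inferred from the strategy name rather than verified against the implementation:

# Sketch: sanity-check the builder used above. The expected message shape
# is an assumption inferred from the diff, not confirmed behavior.
from marin.alignment.generate_responses import RejectedPromptStrategy, _build_rejected_messages

messages = _build_rejected_messages("What is 2+2?", RejectedPromptStrategy.UNGUIDED, None)
print(messages)  # expected: something like [{"role": "user", "content": "What is 2+2?"}]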
