#!/usr/bin/env python3
"""
Analyze mismatches between human difficulty assessments and model performance.

Reads the per-task model difficulty table produced by the difficulty analysis
notebook, attaches the human difficulty label found in each task's
``task.yaml``, and writes two CSV files: the full comparison table and the
list of "edge cases" (tasks no model resolves, and tasks where the human label
and the empirical model difficulty disagree).
"""

import ast
import sys
from pathlib import Path

import pandas as pd

# Ordinal scale shared by human labels and empirical model difficulty.
DIFFICULTY_ORDER = {'easy': 1, 'medium': 2, 'hard': 3}


def load_human_difficulty_labels(tasks_dir=None):
    """Collect the human difficulty label of every task under *tasks_dir*.

    Args:
        tasks_dir: Directory holding one sub-directory per task, each with a
            ``task.yaml`` file. Defaults to the placeholder terminal-bench
            location below.

    Returns:
        Dict mapping task directory name to its lower-cased difficulty label.
        Tasks without a usable label (missing file, unreadable YAML, missing
        or non-string ``difficulty``, or the literal ``unknown``) are omitted.
        An empty dict is returned when *tasks_dir* is not a directory.
    """
    if tasks_dir is None:
        # TODO: Set path to your terminal-bench repository
        tasks_dir = Path.home() / "path/to/terminal-bench" / "tasks"
    tasks_dir = Path(tasks_dir)

    human_labels = {}
    if not tasks_dir.is_dir():
        return human_labels

    # Imported lazily: PyYAML is only needed once there is something to parse,
    # so the analysis helpers stay importable without it.
    import yaml

    for task_dir in sorted(tasks_dir.iterdir()):
        task_yaml_path = task_dir / "task.yaml"
        if not task_dir.is_dir() or not task_yaml_path.is_file():
            continue
        try:
            with open(task_yaml_path, 'r', encoding="utf-8") as f:
                task_config = yaml.safe_load(f)
        except (OSError, UnicodeDecodeError, yaml.YAMLError) as exc:
            # Best effort: one broken task file must not abort the analysis,
            # but it should not disappear silently either.
            print(f"Skipping {task_yaml_path}: {exc}", file=sys.stderr)
            continue

        # An empty YAML file loads as None; a list/scalar document has no keys.
        if not isinstance(task_config, dict):
            continue
        difficulty = task_config.get('difficulty', 'unknown')
        if not isinstance(difficulty, str):
            continue
        difficulty = difficulty.strip().lower()
        if difficulty and difficulty != 'unknown':
            human_labels[task_dir.name] = difficulty

    return human_labels


def load_data():
    """Load the model difficulty table, optional timing table and human labels.

    Paths are relative to the current working directory.

    Returns:
        ``(model_df, human_df, human_labels)``. ``human_df`` is ``None`` when
        the time comparison CSV is absent. All three are ``None`` when the
        model difficulty CSV is absent.
    """
    difficulty_file = "difficulty_analysis_results/task_difficulty.csv"
    if not Path(difficulty_file).exists():
        return None, None, None

    model_df = pd.read_csv(difficulty_file)
    human_labels = load_human_difficulty_labels()

    time_file = "../time_analysis_pipeline/time_analysis_results/human_model_time_comparison.csv"
    human_df = pd.read_csv(time_file) if Path(time_file).exists() else None

    return model_df, human_df, human_labels


def analyze_all_tasks(model_df, human_labels):
    """Attach human labels to *model_df* and score human/model disagreement.

    Args:
        model_df: DataFrame with at least ``task_name``, ``model_difficulty``
            and ``model_resolve_rate`` columns. It is not modified.
        human_labels: Dict mapping task name to human difficulty label.

    Returns:
        ``(all_tasks, with_human_labels, without_human_labels,
        universal_failures)``, each an independent DataFrame copy.
        ``with_human_labels`` (when non-empty) additionally carries
        ``model_difficulty_num``, ``human_difficulty_num``,
        ``mismatch_score`` (human minus model on the 1-3 scale) and
        ``mismatch_type`` (``aligned``, ``model_easier``, ``human_easier`` or
        ``unknown`` when either label is outside the easy/medium/hard scale).
        ``universal_failures`` holds tasks whose resolve rate is exactly 0.
    """
    model_df_enhanced = model_df.copy()
    model_df_enhanced['human_difficulty'] = model_df_enhanced['task_name'].map(human_labels)

    has_label = model_df_enhanced['human_difficulty'].notna()
    with_human_labels = model_df_enhanced[has_label].copy()
    without_human_labels = model_df_enhanced[~has_label].copy()
    universal_failures = model_df_enhanced[model_df_enhanced['model_resolve_rate'] == 0.0].copy()

    if len(with_human_labels) > 0:
        with_human_labels['model_difficulty_num'] = with_human_labels['model_difficulty'].map(DIFFICULTY_ORDER)
        with_human_labels['human_difficulty_num'] = with_human_labels['human_difficulty'].map(DIFFICULTY_ORDER)
        with_human_labels['mismatch_score'] = (
            with_human_labels['human_difficulty_num'] - with_human_labels['model_difficulty_num']
        )

        score = with_human_labels['mismatch_score']
        with_human_labels['mismatch_type'] = 'aligned'
        with_human_labels.loc[score > 0, 'mismatch_type'] = 'model_easier'
        with_human_labels.loc[score < 0, 'mismatch_type'] = 'human_easier'
        # A label outside DIFFICULTY_ORDER yields a NaN score; that is "cannot
        # compare", not agreement, so do not leave it marked as aligned.
        with_human_labels.loc[score.isna(), 'mismatch_type'] = 'unknown'

    return model_df_enhanced, with_human_labels, without_human_labels, universal_failures


def _parse_model_list(value):
    """Decode a ``resolving_models`` cell into a list of model names.

    Accepts an in-memory list/tuple, or the ``repr`` of a list as stored in the
    CSV. Missing values (NaN, None, empty string) decode to an empty list.

    Raises:
        ValueError: If the text is not a list/tuple literal.
        SyntaxError: If the text is not valid Python literal syntax.
    """
    if isinstance(value, (list, tuple)):
        return list(value)
    if not isinstance(value, str) or not value.strip():
        return []
    # literal_eval only accepts literals, so cell text can never run code
    # (the CSV is an external file).
    parsed = ast.literal_eval(value)
    if not isinstance(parsed, (list, tuple)):
        raise ValueError(f"resolving_models is not a list: {value!r}")
    return list(parsed)


def create_edge_case_record(row, case_type, human_df=None):
    """Build the output record for one edge-case task.

    Args:
        row: Mapping or pandas Series for the task; must provide
            ``task_name``, ``resolving_models``, ``model_difficulty``,
            ``model_resolve_rate`` and ``total_models_tested``.
        case_type: Label stored in the record's ``type`` field.
        human_df: Optional timing DataFrame keyed by ``task_name``; the first
            matching row supplies the expert/junior time estimates.

    Returns:
        Dict with the edge-case fields. Values that are unavailable are
        reported as ``'N/A'`` (times, mismatch score) or ``'unknown'``
        (human difficulty).
    """
    task_name = row['task_name']

    expert_time = 'N/A'
    junior_time = 'N/A'
    if human_df is not None:
        human_time_data = human_df[human_df['task_name'] == task_name]
        if len(human_time_data) > 0:
            first_match = human_time_data.iloc[0]
            expert_time = first_match.get('expert_time_estimate_min', 'N/A')
            junior_time = first_match.get('junior_time_estimate_min', 'N/A')

    resolving_models = _parse_model_list(row['resolving_models'])

    # The column normally exists but holds NaN for unlabeled tasks, so the
    # .get() default alone never produces 'unknown'.
    human_difficulty = row.get('human_difficulty', 'unknown')
    if pd.isna(human_difficulty):
        human_difficulty = 'unknown'

    return {
        'type': case_type,
        'task_name': task_name,
        'human_difficulty': human_difficulty,
        'model_difficulty': row['model_difficulty'],
        'model_resolve_rate': row['model_resolve_rate'],
        'models_that_solve': len(resolving_models),
        'total_models_tested': row['total_models_tested'],
        'expert_time_min': expert_time,
        'junior_time_min': junior_time,
        'mismatch_score': row.get('mismatch_score', 'N/A')
    }


def find_edge_cases(all_tasks_df, with_human_labels_df, without_human_labels_df, universal_failures_df, human_df=None):
    """List edge-case records in report order.

    Order: universal failures with a human label, universal failures without
    one, tasks models find easier than humans (largest gap first), then tasks
    humans find easier than models (largest gap first). A task can appear both
    as a universal failure and as a mismatch.

    ``all_tasks_df`` and ``without_human_labels_df`` are accepted for interface
    compatibility and are not read.

    Returns:
        List of dicts as produced by ``create_edge_case_record``.
    """
    def records(frame, case_type):
        return [create_edge_case_record(row, case_type, human_df) for _, row in frame.iterrows()]

    labelled = universal_failures_df['human_difficulty'].notna()
    edge_cases = records(universal_failures_df[labelled], 'universal_failure_with_human_label')
    edge_cases += records(universal_failures_df[~labelled], 'universal_failure_no_human_label')

    if len(with_human_labels_df) > 0:
        mismatch_type = with_human_labels_df['mismatch_type']

        # Stable sort keeps tied tasks in input order, so output is reproducible.
        model_easier = with_human_labels_df[mismatch_type == 'model_easier'].sort_values(
            'mismatch_score', ascending=False, kind='stable')
        edge_cases += records(model_easier, 'model_easier')

        human_easier = with_human_labels_df[mismatch_type == 'human_easier'].sort_values(
            'mismatch_score', ascending=True, kind='stable')
        edge_cases += records(human_easier, 'human_easier')

    return edge_cases


def save_results(edge_cases, all_tasks_df):
    """Write the edge cases and the full comparison table as CSV files.

    Files are written under ``difficulty_analysis_results`` relative to the
    current working directory; the directory is created if needed.

    Returns:
        Number of edge cases written.
    """
    output_dir = Path("difficulty_analysis_results")
    output_dir.mkdir(parents=True, exist_ok=True)

    # Save edge cases
    edge_cases_file = output_dir / "comprehensive_human_model_mismatches.csv"
    pd.DataFrame(edge_cases).to_csv(edge_cases_file, index=False)

    # Save full analysis
    all_tasks_file = output_dir / "all_tasks_human_model_comparison.csv"
    all_tasks_df.to_csv(all_tasks_file, index=False)

    return len(edge_cases)


def main():
    """Run the analysis end to end and print a one-line summary."""
    model_df, human_df, human_labels = load_data()
    if model_df is None:
        print(
            "difficulty_analysis_results/task_difficulty.csv not found; "
            "run the difficulty analysis notebook first",
            file=sys.stderr,
        )
        return

    all_tasks_df, with_human_labels_df, without_human_labels_df, universal_failures_df = analyze_all_tasks(
        model_df, human_labels)

    edge_cases = find_edge_cases(
        all_tasks_df, with_human_labels_df, without_human_labels_df, universal_failures_df, human_df)

    edge_case_count = save_results(edge_cases, all_tasks_df)

    print(f"Analyzed {len(all_tasks_df)} tasks, found {edge_case_count} edge cases")


if __name__ == "__main__":
    main()
DIFFICULTY MATRIX:\n", + "Creates a confusion matrix comparing human predictions vs empirical model performance.\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "import json\n", + "import pandas as pd\n", + "import numpy as np\n", + "import matplotlib.pyplot as plt\n", + "from pathlib import Path\n", + "from datetime import datetime\n", + "import matplotlib.colors as mcolors\n", + "import toml\n", + "import yaml\n", + "\n", + "# TODO: Set path to your terminus2 data directory (output from get_terminus2_runs.py)\n", + "TRAJECTORY_DIR = \"\" # e.g., \"../../../terminus2_9-17_essential_files\"\n", + "RESULTS_DIR = \"difficulty_analysis_results\"\n", + "Path(RESULTS_DIR).mkdir(exist_ok=True)\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def extract_trial_data(trial_dir):\n", + " result_path = trial_dir / \"result.json\"\n", + " if not result_path.exists():\n", + " return None\n", + " \n", + " try:\n", + " with open(result_path) as f:\n", + " result = json.load(f)\n", + " \n", + " verifier_result = result.get('verifier_result') or {}\n", + " reward = verifier_result.get('reward', 0) if isinstance(verifier_result, dict) else 0\n", + " \n", + " data = {\n", + " 'trial_id': result.get('id'),\n", + " 'trial_name': result.get('trial_name'),\n", + " 'model_name': result.get('agent_info', {}).get('model_info', {}).get('name'),\n", + " 'agent_name': result.get('agent_info', {}).get('name'),\n", + " 'task_name': result.get('task_name'),\n", + " 'reward': reward,\n", + " 'success': reward > 0,\n", + " 'trial_uri': result.get('trial_uri'),\n", + " 'created_at': result.get('created_at'),\n", + " }\n", + " \n", + " for phase in ['setup', 'execution']:\n", + " phase_data = result.get(f'agent_{phase}', {})\n", + " start = phase_data.get('started_at')\n", + " end = phase_data.get('finished_at')\n", + " if start and end:\n", + " start_dt = 
datetime.fromisoformat(start.replace('Z', '+00:00'))\n", + " end_dt = datetime.fromisoformat(end.replace('Z', '+00:00'))\n", + " data[f'agent_{phase}_time_sec'] = (end_dt - start_dt).total_seconds()\n", + " else:\n", + " data[f'agent_{phase}_time_sec'] = None\n", + " \n", + " return data\n", + " except:\n", + " return None\n", + "\n", + "def extract_all_trials(trajectories_dir=TRAJECTORY_DIR, output_dir=RESULTS_DIR):\n", + " trajectories_path = Path(trajectories_dir)\n", + " if not trajectories_path.exists():\n", + " return {}, pd.DataFrame()\n", + " \n", + " output_path = Path(output_dir)\n", + " output_path.mkdir(exist_ok=True)\n", + " \n", + " cache_path = output_path / \"trials_cache.json\"\n", + " trials_dict = {}\n", + " if cache_path.exists():\n", + " with open(cache_path) as f:\n", + " trials_dict = json.load(f)\n", + " \n", + " trial_dirs = [d for d in trajectories_path.iterdir() if d.is_dir()]\n", + " new_count = 0\n", + " \n", + " for trial_dir in trial_dirs:\n", + " trial_id = trial_dir.name\n", + " if trial_id not in trials_dict:\n", + " trial_data = extract_trial_data(trial_dir)\n", + " if trial_data:\n", + " trials_dict[trial_id] = trial_data\n", + " new_count += 1\n", + " \n", + " if new_count > 0:\n", + " with open(cache_path, 'w') as f:\n", + " json.dump(trials_dict, f, indent=2)\n", + " \n", + " return trials_dict, pd.DataFrame(list(trials_dict.values()))\n", + "\n", + "trials_dict, trials_df = extract_all_trials()\n", + "trials_df.to_csv(f\"{RESULTS_DIR}/trials_raw.csv\", index=False)\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def calculate_model_task_performance(trials_df):\n", + " trials_df = trials_df.drop_duplicates('trial_id')\n", + " \n", + " grouped = trials_df.groupby(['model_name', 'task_name']).agg({\n", + " 'trial_id': ['count', list],\n", + " 'trial_name': list,\n", + " 'success': ['sum', list],\n", + " 'agent_execution_time_sec': list,\n", + " 
'agent_setup_time_sec': list,\n", + " }).reset_index()\n", + " \n", + " grouped.columns = ['model_name', 'task_name', 'total_trials', 'trial_ids', 'trial_names',\n", + " 'successful_trials', 'success_list', 'execution_times_sec', 'setup_times_sec']\n", + " \n", + " grouped['success_rate'] = grouped['successful_trials'] / grouped['total_trials']\n", + " grouped['resolves_task'] = grouped['successful_trials'] > (grouped['total_trials'] / 2)\n", + " \n", + " grouped['successful_trial_ids'] = grouped.apply(\n", + " lambda row: [tid for tid, success in zip(row['trial_ids'], row['success_list']) if success], \n", + " axis=1\n", + " )\n", + " \n", + " grouped = grouped.drop(['success_list'], axis=1)\n", + " return grouped\n", + "\n", + "performance_df = calculate_model_task_performance(trials_df)\n", + "performance_df.to_csv(f\"{RESULTS_DIR}/model_task_performance.csv\", index=False)\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def calculate_task_resolution(performance_df):\n", + " task_groups = performance_df.groupby('task_name').agg({\n", + " 'model_name': list,\n", + " 'resolves_task': ['count', 'sum', list],\n", + " }).reset_index()\n", + " \n", + " task_groups.columns = ['task_name', 'all_models', 'total_models_tested', 'models_that_resolve', 'resolve_list']\n", + " \n", + " task_groups['resolving_models'] = task_groups.apply(\n", + " lambda row: [model for model, resolves in zip(row['all_models'], row['resolve_list']) if resolves],\n", + " axis=1\n", + " )\n", + " \n", + " task_groups['non_resolving_models'] = task_groups.apply(\n", + " lambda row: [model for model, resolves in zip(row['all_models'], row['resolve_list']) if not resolves],\n", + " axis=1\n", + " )\n", + " \n", + " task_groups['model_resolve_rate'] = task_groups['models_that_resolve'] / task_groups['total_models_tested']\n", + " task_groups = task_groups.drop(['all_models', 'resolve_list'], axis=1)\n", + " \n", + " return 
task_groups\n", + "\n", + "resolution_df = calculate_task_resolution(performance_df)\n", + "resolution_df.to_csv(f\"{RESULTS_DIR}/task_resolution.csv\", index=False)\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def classify_task_difficulty(resolution_df):\n", + " def classify_difficulty(resolve_rate):\n", + " if resolve_rate >= 0.667:\n", + " return 'easy'\n", + " elif resolve_rate >= 0.333:\n", + " return 'medium'\n", + " else:\n", + " return 'hard'\n", + " \n", + " difficulty_df = resolution_df.copy()\n", + " difficulty_df['model_difficulty'] = difficulty_df['model_resolve_rate'].apply(classify_difficulty)\n", + " difficulty_df['human_difficulty'] = None\n", + " \n", + " cols = ['task_name', 'model_resolve_rate', 'model_difficulty', 'human_difficulty', \n", + " 'total_models_tested', 'models_that_resolve', 'resolving_models', 'non_resolving_models']\n", + " difficulty_df = difficulty_df[cols]\n", + " \n", + " return difficulty_df\n", + "\n", + "difficulty_df = classify_task_difficulty(resolution_df)\n", + "difficulty_df.to_csv(f\"{RESULTS_DIR}/task_difficulty.csv\", index=False)\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def load_human_difficulty_labels():\n", + " human_labels = {}\n", + " \n", + " # TODO: Set path to your terminal-bench-2.0-dataset repository\n", + " terminal_bench_2_path = Path.home() / \"path/to/terminal-bench-2.0-dataset\" / \"tasks\"\n", + " if terminal_bench_2_path.exists():\n", + " for task_dir in terminal_bench_2_path.iterdir():\n", + " if not task_dir.is_dir():\n", + " continue\n", + " task_toml_path = task_dir / \"task.toml\"\n", + " if not task_toml_path.exists():\n", + " continue\n", + " try:\n", + " with open(task_toml_path, 'r') as f:\n", + " task_config = toml.load(f)\n", + " task_name = task_dir.name\n", + " difficulty = task_config.get('metadata', {}).get('difficulty', 'unknown')\n", 
+ " if difficulty != 'unknown':\n", + " human_labels[task_name] = difficulty.lower()\n", + " except:\n", + " pass\n", + " \n", + " # TODO: Set path to your terminal-bench repository\n", + " terminal_bench_path = Path.home() / \"path/to/terminal-bench\" / \"tasks\"\n", + " if terminal_bench_path.exists():\n", + " for task_dir in terminal_bench_path.iterdir():\n", + " if not task_dir.is_dir():\n", + " continue\n", + " task_yaml_path = task_dir / \"task.yaml\"\n", + " if not task_yaml_path.exists():\n", + " continue\n", + " try:\n", + " with open(task_yaml_path, 'r') as f:\n", + " task_config = yaml.safe_load(f)\n", + " task_name = task_dir.name\n", + " difficulty = task_config.get('difficulty', 'unknown')\n", + " if difficulty != 'unknown' and task_name not in human_labels:\n", + " human_labels[task_name] = difficulty.lower()\n", + " except:\n", + " pass\n", + " \n", + " return human_labels\n", + "\n", + "def create_confusion_matrix(difficulty_df):\n", + " human_labels = load_human_difficulty_labels()\n", + " \n", + " def get_human_difficulty(task_name):\n", + " return human_labels.get(task_name, 'unknown')\n", + " \n", + " difficulty_df['human_difficulty'] = difficulty_df['task_name'].apply(get_human_difficulty)\n", + " difficulty_df = difficulty_df[difficulty_df['human_difficulty'] != 'unknown']\n", + " \n", + " if len(difficulty_df) == 0:\n", + " return pd.DataFrame()\n", + " \n", + " confusion = pd.crosstab(\n", + " difficulty_df['human_difficulty'], \n", + " difficulty_df['model_difficulty'],\n", + " margins=False\n", + " )\n", + " \n", + " human_categories = ['hard', 'medium']\n", + " empirical_categories = ['easy', 'medium', 'hard']\n", + " \n", + " confusion = confusion.reindex(\n", + " index=human_categories, \n", + " columns=empirical_categories, \n", + " fill_value=0\n", + " )\n", + " \n", + " return confusion\n", + "\n", + "def plot_compact_heatmap(confusion_matrix, output_base, normalize=False):\n", + " plt.rcParams['figure.dpi'] = 300\n", + " 
plt.rcParams['savefig.dpi'] = 300\n", + " \n", + " fig, ax = plt.subplots(figsize=(4.2, 3.6))\n", + " \n", + " if normalize:\n", + " confusion_normalized = confusion_matrix.div(confusion_matrix.sum(axis=1), axis=0) * 100\n", + " plot_data = confusion_normalized.values\n", + " colorbar_label = 'Percentage of Tasks'\n", + " value_format = '.1f'\n", + " value_suffix = '%'\n", + " else:\n", + " plot_data = confusion_matrix.values\n", + " colorbar_label = 'Number of Tasks'\n", + " value_format = 'd'\n", + " value_suffix = ''\n", + " \n", + " colors = ['#f7f7f7', '#c6dbef', '#6baed6', '#3182bd', '#08519c']\n", + " cmap = mcolors.LinearSegmentedColormap.from_list('custom_blues', colors, N=256)\n", + " \n", + " im = ax.imshow(plot_data, cmap=cmap, aspect='equal')\n", + " \n", + " cbar = plt.colorbar(im, ax=ax, shrink=0.5, pad=0.05)\n", + " cbar.set_label(colorbar_label, rotation=90, labelpad=10, fontsize=10)\n", + " cbar.ax.tick_params(labelsize=9)\n", + " \n", + " ax.set_xticks(range(len(confusion_matrix.columns)))\n", + " ax.set_yticks(range(len(confusion_matrix.index)))\n", + " ax.set_xticklabels([col.capitalize() for col in confusion_matrix.columns], fontsize=11)\n", + " ax.set_yticklabels([idx.capitalize() for idx in confusion_matrix.index], fontsize=11)\n", + " \n", + " for i in range(len(confusion_matrix.index)):\n", + " for j in range(len(confusion_matrix.columns)):\n", + " if normalize:\n", + " value = confusion_normalized.iloc[i, j]\n", + " display_value = f\"{value:{value_format}}{value_suffix}\"\n", + " else:\n", + " value = confusion_matrix.iloc[i, j]\n", + " display_value = f\"{value:{value_format}}{value_suffix}\"\n", + " \n", + " text_color = 'black' if value < plot_data.max() * 0.6 else 'white'\n", + " ax.text(j, i, display_value, \n", + " ha=\"center\", va=\"center\", \n", + " color=text_color, \n", + " fontsize=12, \n", + " fontweight='bold')\n", + " \n", + " plt.title('Task Difficulty Matrix', fontsize=12, pad=15, fontweight='bold')\n", + " 
plt.xlabel('Empirical Difficulty', fontsize=10, fontweight='bold', labelpad=8)\n", + " plt.ylabel('Human-Predicted Difficulty', fontsize=10, fontweight='bold', labelpad=8)\n", + " \n", + " ax.set_xticks(np.arange(len(confusion_matrix.columns)) - 0.5, minor=True)\n", + " ax.set_yticks(np.arange(len(confusion_matrix.index)) - 0.5, minor=True)\n", + " ax.grid(which=\"minor\", color=\"white\", linestyle='-', linewidth=2)\n", + " ax.tick_params(which=\"minor\", size=0)\n", + " \n", + " for spine in ax.spines.values():\n", + " spine.set_visible(False)\n", + " \n", + " plt.tight_layout(pad=0.8)\n", + " \n", + " output_file = f\"{output_base}.png\"\n", + " plt.savefig(output_file, \n", + " dpi=300,\n", + " bbox_inches='tight', \n", + " pad_inches=0.05,\n", + " facecolor='white',\n", + " edgecolor='none')\n", + " \n", + " plt.show()\n", + " return confusion_matrix\n", + "\n", + "# Update CSV with human difficulty labels\n", + "def load_human_labels_for_csv():\n", + " human_labels = {}\n", + " \n", + " # TODO: Set path to your terminal-bench-2.0-dataset repository\n", + " path_2_0 = Path.home() / \"path/to/terminal-bench-2.0-dataset\" / \"tasks\"\n", + " if path_2_0.exists():\n", + " for task_dir in path_2_0.iterdir():\n", + " if not task_dir.is_dir():\n", + " continue\n", + " task_toml = task_dir / \"task.toml\"\n", + " if not task_toml.exists():\n", + " continue\n", + " try:\n", + " with open(task_toml, 'r') as f:\n", + " config = toml.load(f)\n", + " difficulty = config.get('metadata', {}).get('difficulty', 'unknown')\n", + " if difficulty != 'unknown':\n", + " human_labels[task_dir.name] = difficulty.lower()\n", + " except:\n", + " pass\n", + " \n", + " # TODO: Set path to your terminal-bench repository\n", + " path_orig = Path.home() / \"path/to/terminal-bench\" / \"tasks\"\n", + " if path_orig.exists():\n", + " for task_dir in path_orig.iterdir():\n", + " if not task_dir.is_dir():\n", + " continue\n", + " task_yaml = task_dir / \"task.yaml\"\n", + " if not 
task_yaml.exists():\n", + " continue\n", + " try:\n", + " with open(task_yaml, 'r') as f:\n", + " config = yaml.safe_load(f)\n", + " task_name = task_dir.name\n", + " difficulty = config.get('difficulty', 'unknown')\n", + " if difficulty != 'unknown' and task_name not in human_labels:\n", + " human_labels[task_name] = difficulty.lower()\n", + " except:\n", + " pass\n", + " \n", + " return human_labels\n", + "\n", + "# Update difficulty_df with human labels\n", + "human_labels_for_csv = load_human_labels_for_csv()\n", + "difficulty_df['human_difficulty'] = difficulty_df['task_name'].map(human_labels_for_csv)\n", + "difficulty_df.to_csv(f\"{RESULTS_DIR}/task_difficulty.csv\", index=False)\n", + "\n", + "confusion = create_confusion_matrix(difficulty_df)\n", + "if len(confusion) > 0:\n", + " plot_compact_heatmap(confusion, f\"{RESULTS_DIR}/difficulty_heatmap_normalized\", normalize=True)\n" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": ".venv", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.13.5" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/notebooks/difficulty_analysis_pipeline/results/difficulty_heatmap_normalized.png b/notebooks/difficulty_analysis_pipeline/results/difficulty_heatmap_normalized.png new file mode 100644 index 0000000..8c1ad90 Binary files /dev/null and b/notebooks/difficulty_analysis_pipeline/results/difficulty_heatmap_normalized.png differ diff --git a/notebooks/difficulty_analysis_pipeline/results/model_task_performance.csv b/notebooks/difficulty_analysis_pipeline/results/model_task_performance.csv new file mode 100644 index 0000000..fc542ab --- /dev/null +++ b/notebooks/difficulty_analysis_pipeline/results/model_task_performance.csv @@ -0,0 +1,1185 @@ 
+model_name,task_name,total_trials,trial_ids,trial_names,successful_trials,execution_times_sec,setup_times_sec,success_rate,resolves_task,successful_trial_ids +OpenAI/gpt-oss-20B,adaptive-rejection-sampler,5,"['561d7842-83b8-4a42-b69a-65cf1e9fad86', '8afc75a0-d7fa-476a-8446-a550a85dfed3', 'bfa8776a-80a9-415d-852c-96443f9b1d53', '151073a2-a54b-4f6e-8442-b7fbf8ed6d8b', '7bd796df-e2b8-4d9e-9ba7-79fcc6617b53']","['adaptive-rejection-sampler__XZiZTFd', 'adaptive-rejection-sampler__8n5ggAM', 'adaptive-rejection-sampler__gxfqL2r', 'adaptive-rejection-sampler__p55YjWV', 'adaptive-rejection-sampler__QPav52F']",0,"[356.535976, 143.258045, 85.64665, 133.689527, 155.80654]","[36.204383, 50.093515, 26.960509, 137.441468, 57.103727]",0.0,False,[] +OpenAI/gpt-oss-20B,bn-fit-modify,5,"['4bba3d44-015c-4200-b85a-ab3e5c8aed1d', '5433cf05-62ee-421d-98a5-869a8e759388', '06212dbc-e651-40e9-b820-52531b9c06a2', '060c3b7f-3ca7-4d76-9679-50f464e8ee2a', '3f96f923-505b-417b-ba4c-db87355276a3']","['bn-fit-modify__itWp4xH', 'bn-fit-modify__3RiqRTz', 'bn-fit-modify__ZEB4GhA', 'bn-fit-modify__EAwb4U2', 'bn-fit-modify__twJvU7b']",0,"[1900.158172, 3603.325587, 79.49707, 254.911604, 138.079409]","[28.216681, 14.425012, 22.310754, 202.211089, 96.883074]",0.0,False,[] +OpenAI/gpt-oss-20B,break-filter-js-from-html,5,"['3e75109c-dca6-48d8-811a-5c11cd582bfc', 'bfb7ed66-7436-4b27-bd32-e7b979be28c0', '39a144f0-d030-4241-92e0-34e1aa0742b8', 'b30e7168-b15f-4fc1-ae27-dfd4ecd24dfc', '70adc40b-624b-4249-b8c4-71265ef42d2a']","['break-filter-js-from-html__uLoNBna', 'break-filter-js-from-html__JfRgzn8', 'break-filter-js-from-html__TYDqLuT', 'break-filter-js-from-html__Hx9WLLk', 'break-filter-js-from-html__BCbKkge']",0,"[91.586926, 65.606627, 91.90294, 104.0089, 247.076007]","[13.194741, 44.462491, 88.774913, 116.258986, 80.839722]",0.0,False,[] +OpenAI/gpt-oss-20B,build-cython-ext,5,"['76f5c077-dde5-4026-837f-1acfe41f861d', 'e722ba2f-8654-4ae3-804b-678cd2824d2a', '32f14803-ec52-440f-8a12-0cad8c9760ea', 
'f69f4d15-4421-4a0f-8f73-2008d632673f', 'b13313d9-5438-46be-ae96-e0f67366f950']","['build-cython-ext__MQPLwV5', 'build-cython-ext__ztfPQcf', 'build-cython-ext__cJ3kLxr', 'build-cython-ext__S7VHE3p', 'build-cython-ext__MnHvsU4']",0,"[900.035396, 900.344872, 68.01344, 908.079582, 152.200359]","[53.304185, 12.091994, 88.384178, 64.562149, 70.577813]",0.0,False,[] +OpenAI/gpt-oss-20B,build-initramfs-qemu,5,"['fd0833bc-42b9-43c0-ace8-4ab501c51855', '735d02ac-4a7f-41d6-89de-177acbdfe2dc', '639ce984-cf12-41cc-ae92-21d7b63f7f30', 'e9a59387-1fcd-434b-bf47-ee3835be3fd8', '3bb03f30-e18b-4f4f-a320-aac0d1896623']","['build-initramfs-qemu__KXQSGU9', 'build-initramfs-qemu__g3CEhZ2', 'build-initramfs-qemu__jSvgtEE', 'build-initramfs-qemu__SaRY9cs', 'build-initramfs-qemu__ZB3f2Bw']",0,"[29.739768, 260.08733, 76.339363, 47.463443, 49.997346]","[10.189678, 72.982065, 153.2956, 7.903013, 26.253912]",0.0,False,[] +OpenAI/gpt-oss-20B,build-pmars,5,"['437f079f-caf5-48c8-95b1-89039ff6c5c9', 'e4da006e-8250-4cb3-b54c-42d38e2be7cd', '5b43a50e-c179-4749-bec9-4e61b6a09273', '0e064c95-5952-48c4-a446-b36343aef6d4', '053f8996-cefb-46ab-9ef1-78234c2cf87c']","['build-pmars__LzCa6K8', 'build-pmars__Zac5Msa', 'build-pmars__oGMtgvC', 'build-pmars__bo4BQeK', 'build-pmars__pfEaEPa']",0,"[235.343206, 900.788083, 155.506388, 93.49419, 926.337452]","[2.984802, 36.048627, 9.480113, 11.479001, 29.737258]",0.0,False,[] +OpenAI/gpt-oss-20B,build-pov-ray,5,"['74324bec-f1be-4d47-a7cc-b72993ddc0da', '6ccc8c1a-2433-4123-ae3e-7d6bb58f5d19', '18aab19a-ca7e-444b-8372-dda7abb9b3f9', 'c941f4df-e03f-4abf-ad88-8de43c3be3bf', 'ac89b36e-386b-4d93-813d-c24e88224aae']","['build-pov-ray__txpnc9X', 'build-pov-ray__5db5ngt', 'build-pov-ray__HwQDfe5', 'build-pov-ray__8FP83uq', 'build-pov-ray__VewweaW']",0,"[130.354514, 788.412803, 250.990985, 110.50938, 106.784039]","[76.700355, 70.701523, 9.128604, 37.147718, 37.693313]",0.0,False,[] +OpenAI/gpt-oss-20B,cancel-async-tasks,5,"['48158799-107d-421b-b34e-02fa5a8d38c5', 
'a322daa4-5bd5-44b2-ac24-f699a5301179', '65793433-8b24-453c-8d2e-343f8ad68ecc', '71170a6c-0013-4658-9225-e1c911803c0d', '2292ab98-2e7a-4557-a861-3a55dc2f308c']","['cancel-async-tasks__2KbotSd', 'cancel-async-tasks__Tfug3LY', 'cancel-async-tasks__E68Su68', 'cancel-async-tasks__5fSQ4X4', 'cancel-async-tasks__cmksCV9']",0,"[47.596013, 15.837117, 40.721059, 18.26774, 42.635609]","[51.303026, 85.78533, 56.108009, 162.581708, 64.591333]",0.0,False,[] +OpenAI/gpt-oss-20B,chess-best-move,5,"['3ea753e1-fe93-4202-af79-4ab725485edf', 'e6b5cecc-812d-43ed-a808-f36276f54b3e', 'd9161c9e-95b9-404e-8e29-5e2806179721', '07bec61b-b81e-430f-89af-0cd357b06d3b', '0a34123c-a794-4328-8737-19ad0a7087d4']","['chess-best-move__ABYdpxw', 'chess-best-move__FDQ5uTm', 'chess-best-move__YMpnusC', 'chess-best-move__CGFhTQm', 'chess-best-move__woxDZzA']",0,"[54.659025, 91.240332, 35.322172, 835.851092, 57.042881]","[36.503218, 98.528029, 66.665917, 13.25733, 6.722724]",0.0,False,[] +OpenAI/gpt-oss-20B,circuit-fibsqrt,5,"['120fc17b-a4a6-44d3-8086-4ab7ff3a8508', '11f82b89-1f7f-49b5-88d5-728824e335eb', '42979eaf-056d-47bf-b494-6908f91d1bee', '4ada5ba2-e124-4f16-b1d7-f3196cfd1fff', '790e2529-d424-46a6-947b-5d207053c57b']","['circuit-fibsqrt__vGKeDtL', 'circuit-fibsqrt__xf4h5FN', 'circuit-fibsqrt__Uydy5RB', 'circuit-fibsqrt__Qxzqf7K', 'circuit-fibsqrt__7YHZUv7']",0,"[285.791206, 103.985823, 81.249671, 78.605927, 2432.870014]","[8.37542, 24.721528, 15.490625, 34.264113, 33.115557]",0.0,False,[] +OpenAI/gpt-oss-20B,cobol-modernization,5,"['40b7f302-ba98-4531-9163-ea1f4de8db7f', 'b86f0b24-e961-43a0-8712-515abb171646', 'd42b7534-4973-449d-ac23-2c662367124f', 'fac03630-83fa-4994-9021-15a0789c8dbd', '512780bd-2799-47af-9c82-8aad4a47f567']","['cobol-modernization__RuRjt4q', 'cobol-modernization__UCpGBkb', 'cobol-modernization__HoBPpUr', 'cobol-modernization__4sKEgZP', 'cobol-modernization__t9pmwsK']",0,"[914.721612, 914.552962, 920.936867, 914.934667, 211.925308]","[46.229971, 50.802985, 119.210785, 53.693449, 
55.889986]",0.0,False,[] +OpenAI/gpt-oss-20B,code-from-image,5,"['8c4b3e68-ae5f-449f-8144-73be29b7ab11', '924f6034-22de-4b5f-9daa-f5a9151f7a97', 'b35f5b57-f56d-4958-8137-8cc6e3d73957', 'a8d8de43-7c71-4506-a1b0-3bcb214dbbc4', 'bb589b01-66a6-4610-89ee-913042e7ac87']","['code-from-image__dr9u4bz', 'code-from-image__gB9Avso', 'code-from-image__gLcnyGW', 'code-from-image__QcBY6J9', 'code-from-image__ieWURHU']",0,"[89.516199, 64.803339, 42.88561, 30.53173, 32.796986]","[19.207764, 15.999952, 72.568905, 40.892161, 65.127544]",0.0,False,[] +OpenAI/gpt-oss-20B,configure-git-webserver,5,"['0acbeb7c-6c3a-404b-8dfe-a0d9aacc7d93', 'c9a872d7-0547-42ee-ad4c-6844c69dfc4c', '4ad19b08-5854-4974-bbe5-64e5328a55d8', '2ebc23fc-7ddb-41c6-832b-62bbf31be73e', '630206c4-0c29-4798-9ad7-8e52e574e5c3']","['configure-git-webserver__fYARQEy', 'configure-git-webserver__sig2Gs4', 'configure-git-webserver__qYcqCbL', 'configure-git-webserver__mUjqQiA', 'configure-git-webserver__HVEK744']",1,"[104.181251, 254.30957, 149.752211, 356.76794, 591.241932]","[37.562469, 49.190905, 58.829724, 30.004241, 94.294384]",0.2,False,['c9a872d7-0547-42ee-ad4c-6844c69dfc4c'] +OpenAI/gpt-oss-20B,constraints-scheduling,5,"['b0a6ac8e-5c70-4a73-b11f-022db4f66eae', 'f5fc4ce5-180d-4f1d-b0c2-07a7f72bc30f', '5b0725c5-1ab5-4b5d-a00f-150016e2fcdb', '9ae33fa8-67e9-453a-af59-1457992f1cac', 'a8ba26b7-655c-4485-983a-a3a3d551f68e']","['constraints-scheduling__zgmaRQ4', 'constraints-scheduling__Wmay4bu', 'constraints-scheduling__9LJ89WG', 'constraints-scheduling__4hhUprb', 'constraints-scheduling__Fjb4GCN']",1,"[192.806271, 74.12003, 206.900755, 195.872986, 311.04735]","[173.213973, 37.619493, 46.496881, 12.660308, 49.813399]",0.2,False,['9ae33fa8-67e9-453a-af59-1457992f1cac'] +OpenAI/gpt-oss-20B,count-dataset-tokens,5,"['9c57bd96-8700-4ff8-9b58-3999eb0b95c3', '72b2b9e6-09af-4650-93bc-9971a8660491', 'c0862183-8e5b-4ce4-a85d-61b58affe465', 'ef7c7d72-684c-42a7-a40f-1afbdbaab05d', 
'5f7e7074-edc2-48c1-b771-572113e7a02b']","['count-dataset-tokens__XJnHMp4', 'count-dataset-tokens__bdDmLNW', 'count-dataset-tokens__gqn8RiA', 'count-dataset-tokens__9tzGrwd', 'count-dataset-tokens__JQJQa2d']",0,"[914.908032, 250.126521, 731.413682, 902.607654, 904.826627]","[45.522409, 100.917241, 113.124475, 35.761084, 36.056869]",0.0,False,[] +OpenAI/gpt-oss-20B,crack-7z-hash,5,"['fdd94540-7594-49a7-bb23-783acb52fe21', 'c8b14e1d-3119-4e5d-93ca-39440cbfe117', '2add1490-1465-49a4-bafc-b9b1c19f266b', '5156ccac-113d-4a64-8dcd-bb3153ab89b5', '4dbe1823-00d9-4988-a879-f62258452369']","['crack-7z-hash__8Y3yt8B', 'crack-7z-hash__XU6ctyb', 'crack-7z-hash__cVbtCjG', 'crack-7z-hash__ZL2Q8DP', 'crack-7z-hash__zs9yQTK']",0,"[44.670902, 6.494683, 12.386415, 24.209075, 36.760144]","[26.584269, 10.58808, 18.531043, 135.177293, 24.363861]",0.0,False,[] +OpenAI/gpt-oss-20B,db-wal-recovery,5,"['11e10566-b462-43f1-9216-f805f03f0392', '23485f97-ff71-42ec-a1f9-1efda9e5d771', '5002fde0-a647-43d4-b942-0f9c6e1dc5ca', '3e4d3122-e7a6-40f3-8239-33e4e9706245', '4ae56090-760a-4635-9528-d708a6624d2e']","['db-wal-recovery__Koiy6sr', 'db-wal-recovery__qTkaN4v', 'db-wal-recovery__iLFsjSL', 'db-wal-recovery__AQoxUoP', 'db-wal-recovery__H3r4wDv']",0,"[148.530202, 106.632391, 68.550202, 326.298205, 59.896131]","[36.518805, 24.197566, 10.499421, 29.11496, 49.66205]",0.0,False,[] +OpenAI/gpt-oss-20B,distribution-search,5,"['648aceaf-ba05-44b2-bc7a-e02573892ee4', 'bf0a34aa-4602-4f5b-ab8f-30df5026db01', 'ebbfbed3-c4d8-4a8f-8a9c-ecf733f3dc47', 'c0a69b8a-d68b-4619-82c3-119c751921d9', '7f58e472-5978-450a-b836-97b96ec69a30']","['distribution-search__bQiHRJd', 'distribution-search__PwoC3Tj', 'distribution-search__xLgAwPJ', 'distribution-search__FGnyqqe', 'distribution-search__prGWwEC']",0,"[101.232021, 72.697168, 134.236845, 128.520165, 119.747625]","[25.475571, 55.929602, 28.122663, 114.620254, 90.097641]",0.0,False,[] +OpenAI/gpt-oss-20B,dna-assembly,5,"['13e970cf-3aa0-47ab-8c9a-303ec4e7b4ab', 
'679104e1-676c-4505-8748-5e96da2b5f67', '394fe1f8-c289-4c5c-b07e-a7169c09b8d0', 'd3aac658-dcd2-4c5b-a20d-318c6881e5c4', '7ec5016b-f239-40e8-9d01-f49574de6133']","['dna-assembly__NoBz4ih', 'dna-assembly__MTpxrq9', 'dna-assembly__hbXD4UG', 'dna-assembly__nxqfV2H', 'dna-assembly__8qRtQnj']",0,"[721.18646, 227.617005, 328.308152, 72.249329, 738.708681]","[62.102204, 52.349978, 51.167877, 16.412427, 35.561215]",0.0,False,[] +OpenAI/gpt-oss-20B,dna-insert,5,"['09868f26-ef68-4ba2-92c2-2b4624a6902f', '55dadd19-ba2b-4f0a-94cb-ba498bcf2bfa', 'c200ee65-6142-4bae-9d20-bea5f910505b', '623c665d-c336-4e94-8d21-e55ce2dd16bb', '72049f09-05fb-4284-944c-78cfc6d74d3e']","['dna-insert__3gdrMvg', 'dna-insert__665iEgQ', 'dna-insert__hfVCc2L', 'dna-insert__haN67ae', 'dna-insert__iqBPa6s']",0,"[366.914253, 422.784881, 372.228474, 585.561517, 382.027021]","[140.169489, 38.67192, 25.694569, 49.015927, 16.508326]",0.0,False,[] +OpenAI/gpt-oss-20B,extract-elf,5,"['90be352b-40b1-4d3b-aedb-7baca3e0d05f', '21a9659f-de06-42f2-9d1d-82b0b91f417e', '683d4f59-6d7f-422d-a42b-0a726b65423e', 'b47fcd39-a3cb-4d0e-992e-41c130136f58', '69e538e2-a590-4f11-bdbf-8ca774e0142d']","['extract-elf__HxD3cXX', 'extract-elf__XTnmypk', 'extract-elf__TDyDuXN', 'extract-elf__Li9cSdv', 'extract-elf__PnBWRxA']",1,"[42.176015, 902.545987, 143.858656, 57.894756, 90.621321]","[135.154087, 43.403232, 22.027285, 12.682398, 45.864086]",0.2,False,['69e538e2-a590-4f11-bdbf-8ca774e0142d'] +OpenAI/gpt-oss-20B,feal-differential-cryptanalysis,5,"['4b071e58-8132-4351-ac84-74de9436119f', '3dae731a-d189-4f14-bfa5-c1efb7d0d997', 'e0b03cca-11df-45ca-8229-5dcec2e172ce', '4f7db1d1-290c-4f6e-994a-ef7251203e4d', '3f097312-f313-44f8-a08e-d0b3be32473b']","['feal-differential-cryptanalysis__ekrPYfH', 'feal-differential-cryptanalysis__q3Pebio', 'feal-differential-cryptanalysis__YNrK3Hr', 'feal-differential-cryptanalysis__K3LSXkn', 'feal-differential-cryptanalysis__DbTrDxu']",0,"[65.323061, 231.52774, 2439.887236, 276.480175, 
180.345809]","[23.30966, 95.029445, 180.08822, 16.562334, 36.411004]",0.0,False,[] +OpenAI/gpt-oss-20B,feal-linear-cryptanalysis,5,"['cc28009f-3117-4466-a75f-6fb0cf402b6e', '83f43bf6-9c3d-4b94-a868-e3bc947d5a29', '835e01a1-3a0c-4cd9-9ae1-62774e9554f8', '428be7b3-6c27-44ad-8e77-08cdf281d012', 'bfc30cf3-c2d1-484f-bd40-5cba87c9c021']","['feal-linear-cryptanalysis__ZdMJuCK', 'feal-linear-cryptanalysis__omrtvBe', 'feal-linear-cryptanalysis__8uPngxj', 'feal-linear-cryptanalysis__jccNrcZ', 'feal-linear-cryptanalysis__9MViabC']",0,"[1042.670139, 1814.977613, 1819.826953, 1848.56029, 1836.216547]","[63.468112, 37.619788, 43.779685, 27.273951, 61.348292]",0.0,False,[] +OpenAI/gpt-oss-20B,filter-js-from-html,5,"['9e8a65a4-341a-4191-b20e-b19282e522c3', '9ef00f16-ed04-43ab-a38c-cf44c5f68db1', '901e125f-f6c2-448d-abb4-e68ec54b135c', '86ae226e-e887-4b5e-8180-749d1d2bfc54', '8891dd1c-48f2-4c4c-ad0a-011b8107999d']","['filter-js-from-html__FxcDsoU', 'filter-js-from-html__9qYZ6Vn', 'filter-js-from-html__b2zmUXY', 'filter-js-from-html__9nBBMSW', 'filter-js-from-html__d2mYY6H']",0,"[362.813859, 23.847287, 312.836902, 12.630612, 30.840991]","[61.018757, 44.990125, 43.23453, 23.081222, 32.105422]",0.0,False,[] +OpenAI/gpt-oss-20B,financial-document-processor,5,"['793c9421-dbf2-43ec-b371-98c8abf8e397', '9268506e-45bf-4157-8513-26dd0f6c57c1', '2d8ee2fc-2016-4245-9a1e-1d3ac4749918', 'cfd19a89-1abe-4c5c-9012-cabfa936a0b4', 'fdcd4aad-a898-463e-a532-5a40cd5a9e28']","['financial-document-processor__Xd6vrBu', 'financial-document-processor__jQqck9d', 'financial-document-processor__gPLxgKq', 'financial-document-processor__FWoiEtv', 'financial-document-processor__KxDW7wN']",0,"[45.209994, 128.282891, 76.534794, 99.55459, 100.421997]","[47.511469, 29.593382, 194.013943, 64.10166, 136.656089]",0.0,False,[] +OpenAI/gpt-oss-20B,fix-code-vulnerability,5,"['a1875ad8-1a4e-4f8a-8050-686003be6920', 'b88bd526-aea9-4290-91d6-14fa1cd84bf1', '2ea58c60-b0c8-4e9b-a5aa-2f4958ba1bad', 
'3d39b1b7-6f24-46d6-bf79-23703ede6295', 'a49fb737-4705-462a-96f3-1544614fa7cc']","['fix-code-vulnerability__qYsvPL6', 'fix-code-vulnerability__uj7Em59', 'fix-code-vulnerability__PYVsTta', 'fix-code-vulnerability__Eg7Dfj3', 'fix-code-vulnerability__ujgGuoL']",0,"[904.798113, 906.414627, 982.462561, 1013.047545, 900.024056]","[9.812766, 4.639908, 44.250446, 82.131512, 19.827374]",0.0,False,[] +OpenAI/gpt-oss-20B,fix-git,5,"['c8e6a74b-a916-4ac5-94e3-15bbe499d3c3', '336786f3-44e9-4241-bb51-282b3bfca6c3', '55e27864-033f-4863-b2fd-2c0fadc49d73', 'f982da4b-04b2-4db7-83fc-467ad22d635d', '1e2e71c0-1c83-46c4-88a9-59e58336cc96']","['fix-git__VDdegzx', 'fix-git__swFKkjp', 'fix-git__L3bcJpN', 'fix-git__H6xzpqQ', 'fix-git__rad5ZgC']",1,"[911.780632, 256.074607, 103.285848, 153.742197, 91.160401]","[21.172295, 52.462312, 46.707654, 51.839512, 40.53448]",0.2,False,['1e2e71c0-1c83-46c4-88a9-59e58336cc96'] +OpenAI/gpt-oss-20B,fix-ocaml-gc,4,"['eb30c74b-1c11-4009-b244-0677bdd2ca51', '2eb2a5c6-a060-4a4e-a0f4-42b8a04e8e2c', 'bbd68584-8d73-4538-a6e8-0b466cb4dabf', 'ea6014af-ac3f-4ead-8747-bc79e988f823']","['fix-ocaml-gc__KcoJThg', 'fix-ocaml-gc__PWi7yN4', 'fix-ocaml-gc__EyKDpx5', 'fix-ocaml-gc__bsNScfB']",0,"[197.872133, 587.239527, 189.782575, 3600.737771]","[57.934679, 32.256836, 123.022945, 268.272578]",0.0,False,[] +OpenAI/gpt-oss-20B,form-filling,5,"['5e1c948c-844a-4a8c-8365-a0fbb4e59453', 'dcacb5e0-8329-490c-8a9f-730e0e2a6202', 'ab35bc21-50bb-49b3-8320-275df99d315e', '7b2234a6-f38f-4ffb-9fe4-374651004adc', 'd56f6a1b-b9c1-49a2-9dea-38e180430db7']","['form-filling__LuYX6KM', 'form-filling__FFPjYCt', 'form-filling__qgLJDhz', 'form-filling__tu42s73', 'form-filling__ie3DEjC']",0,"[107.531632, 178.350158, 60.368895, 187.701452, 906.36875]","[39.693382, 56.548834, 3.529811, 4.151272, 23.255559]",0.0,False,[] +OpenAI/gpt-oss-20B,git-leak-recovery,5,"['ba1cb721-476c-4678-b6d9-a32c574299f9', '56dc328c-31f0-410c-ac75-12da0e370794', 'a61f3994-527d-4adb-8aca-fc1eb3c11d24', 
'45d4a871-c0d3-46a8-bf94-b396141700ea', '6e1012e9-d93a-4f4e-afcb-485424525ae2']","['git-leak-recovery__Eq4u6zS', 'git-leak-recovery__RxNLkkN', 'git-leak-recovery__U8vHMxZ', 'git-leak-recovery__HW28HQy', 'git-leak-recovery__7RtnviP']",0,"[98.778482, 254.141303, 29.240326, 106.92239, 159.565248]","[68.294551, 51.519612, 182.66139, 79.375878, 63.326485]",0.0,False,[] +OpenAI/gpt-oss-20B,gpt2-codegolf,5,"['bfb9b1fc-26f4-42e1-b2d3-a49bbadf4b95', '82d01940-7c56-4554-aa39-595ae80879a5', 'e90c74f8-8785-42e4-97cf-b377cc708d7d', 'e45353e4-e3b0-4389-a617-843ac953c8c7', 'da53f72c-0961-4c90-9fcb-bc6427559a75']","['gpt2-codegolf__iTgSEsv', 'gpt2-codegolf__Cp2MhNB', 'gpt2-codegolf__s4soDrf', 'gpt2-codegolf__mW5zDQs', 'gpt2-codegolf__dxsFrRX']",0,"[774.970246, 910.717093, 10.965606, 210.674505, 902.115949]","[99.741873, 47.927244, 36.400425, 155.123884, 130.234032]",0.0,False,[] +OpenAI/gpt-oss-20B,hf-model-inference,5,"['45f5468c-e184-4704-8a82-118e3cf6c0d1', '7eaf2575-5a2d-44e1-bd1d-8d5ec64bf32c', '063dbee8-7e63-4b3c-a5eb-5e5623214906', 'c61ad51e-9a6c-4085-94fb-66925868beba', '5f351a46-6d51-4254-9daa-c74ecf3f2d92']","['hf-model-inference__Lhwzmsh', 'hf-model-inference__GA3Xcqi', 'hf-model-inference__fGUSTKN', 'hf-model-inference__GFw3UaV', 'hf-model-inference__WWr5EtL']",2,"[129.096941, 66.961364, 156.540089, 905.219522, 238.969891]","[25.932999, 40.918274, 46.388818, 40.000748, 26.044514]",0.4,False,"['7eaf2575-5a2d-44e1-bd1d-8d5ec64bf32c', '5f351a46-6d51-4254-9daa-c74ecf3f2d92']" +OpenAI/gpt-oss-20B,install-klee-minimal,5,"['a0021cd1-27b7-40af-beb5-95c435a72b9d', '49d27d7b-c31b-404d-8dc0-10304583cfa9', 'd7bfb42f-de75-4c2c-be83-ce71a305d884', '9a82236c-73aa-4933-9072-6170ec8f32ab', '5e4c0b84-e784-4546-9881-c8dc44e5abb1']","['install-klee-minimal__dyPLtCU', 'install-klee-minimal__fCwAg7q', 'install-klee-minimal__nSt8A8a', 'install-klee-minimal__4ZUEvLL', 'install-klee-minimal__wS4HocK']",0,"[507.812452, 912.707267, 132.403881, 472.458872, 233.394304]","[173.406265, 103.689194, 
90.161779, 77.480307, 149.475199]",0.0,False,[] +OpenAI/gpt-oss-20B,install-windows-3.11,5,"['64931b53-228e-46a7-aa3a-1526a1b8d21a', 'c35a1676-903b-406e-af91-f0375f114072', '7b56cb74-5bd8-4174-a21c-46d1db75dc75', 'd533451c-1bcf-4296-b702-3cc9dbcf5a72', '972a00a6-60a6-4ec3-928f-199ea182a3d1']","['install-windows-3.11__u8Md8UG', 'install-windows-3.11__ZhB93ch', 'install-windows-3.11__CkYbfT6', 'install-windows-3.11__e2koycA', 'install-windows-3.11__7eK4R49']",0,"[186.712339, 39.093198, 243.355714, 3606.884224, 1510.922286]","[14.194608, 30.558615, 118.808968, 39.656993, 25.952671]",0.0,False,[] +OpenAI/gpt-oss-20B,large-scale-text-editing,5,"['6ab32e2a-c3d4-447b-ac01-11ab0712d5f0', 'b8c86452-c159-4f72-9021-5620fb5877fc', 'b3af42e9-65f6-4234-9ff0-2cefa8e50d48', '1b927bd5-a0d3-4364-b630-1f7e80fd9e28', '3adbea08-93ea-4db0-93c1-1d3e809c0cd3']","['large-scale-text-editing__rrzYJPf', 'large-scale-text-editing__rPB2EU3', 'large-scale-text-editing__Wpyfh2C', 'large-scale-text-editing__KC73e8U', 'large-scale-text-editing__i9pnnfs']",0,"[51.851568, 218.138787, 192.586515, 1238.868658, 115.260378]","[75.966265, 156.729157, 43.484625, 128.902189, 20.07828]",0.0,False,[] +OpenAI/gpt-oss-20B,largest-eigenval,5,"['76cecade-671c-4521-bd1c-28b05718238b', 'a5bc764c-9b04-4ed7-bc2b-81d75b416966', '448fc72d-8763-484e-ac7e-ca04df78b9f2', 'f7208ee3-1cda-4070-892d-204c5b8d6e3c', '08622f25-0d54-4aea-b380-6b7dab1d94f0']","['largest-eigenval__ACktBH3', 'largest-eigenval__PiGYWqf', 'largest-eigenval__n3cNQqo', 'largest-eigenval__uX3e7XP', 'largest-eigenval__AfqfoL5']",0,"[165.682031, 30.447841, 87.474697, 210.989092, 45.439537]","[51.655657, 20.178508, 176.067123, 127.547307, 9.015836]",0.0,False,[] +OpenAI/gpt-oss-20B,log-summary-date-ranges,5,"['efdc5c20-1718-47b6-a2b0-32fb91316324', '89d626cc-dd10-435f-84d8-5f6ce239d420', '1fc36c0c-9446-4d39-885e-efa9318ddf08', 'b39ba18e-5c9b-466f-af75-b92ae040c483', 'fed0226a-8ea0-4871-8033-7aa26322c6c8']","['log-summary-date-ranges__FqHFTeN', 
'log-summary-date-ranges__tqiSoKt', 'log-summary-date-ranges__jN3iK5q', 'log-summary-date-ranges__W5SLP4f', 'log-summary-date-ranges__82sWPqG']",0,"[100.720318, 237.287327, 70.176661, 248.833063, 52.304569]","[46.008606, 13.12906, 56.270167, 37.701225, 16.888224]",0.0,False,[] +OpenAI/gpt-oss-20B,make-doom-for-mips,5,"['3e855e2b-0bdf-4f53-9db2-804d20315d0b', 'b26ca7ce-077f-40ab-8184-f7941fe9004c', '0294ef5b-3b04-4640-a9ed-dbc7bd635c20', 'd3f409e7-2c2c-4af2-85fc-462581211307', '66da4493-692e-4994-b2c2-b643413bb672']","['make-doom-for-mips__oao2v4d', 'make-doom-for-mips__UsXvxEP', 'make-doom-for-mips__BZhDKKu', 'make-doom-for-mips__9GEckft', 'make-doom-for-mips__EPjaGaQ']",0,"[903.622876, 908.142126, 1001.54888, 350.095345, 917.600996]","[137.677545, 29.67371, 140.584501, 93.324024, 58.319687]",0.0,False,[] +OpenAI/gpt-oss-20B,make-mips-interpreter,5,"['ee777adb-bd45-4d0a-811d-3814eaae0c3d', 'f6a4a0f7-99ac-4714-ba7a-d2a2c2b303d5', 'd2987b53-5eb3-489c-860e-497852477770', '9ae38130-a5d9-4d32-92ba-3b0031549ab2', 'c4dbba28-aee0-47c5-b50b-b07b2d88c58d']","['make-mips-interpreter__YrzgGvX', 'make-mips-interpreter__ysadGQq', 'make-mips-interpreter__XxExAgj', 'make-mips-interpreter__2FpoXyT', 'make-mips-interpreter__cr5aGVz']",0,"[1807.920061, 398.553723, 1816.206139, 1806.003414, 2058.869895]","[70.732603, 53.300231, 243.55586, 11.26189, 20.892769]",0.0,False,[] +OpenAI/gpt-oss-20B,merge-diff-arc-agi-task,5,"['3e744871-e3a7-42ae-8c36-e15d6218105a', 'eabfef9d-eafc-42e7-9724-16d9569da1d4', '61ef7093-b1fa-4d69-9ce6-92721df3d9da', '68d460e9-ba62-4b1b-8064-f2f5461eb415', '6d8ef277-cebf-41e1-80ac-45f337a26299']","['merge-diff-arc-agi-task__sMCobWq', 'merge-diff-arc-agi-task__HbGhNfn', 'merge-diff-arc-agi-task__6KSCzh4', 'merge-diff-arc-agi-task__cEpWaHB', 'merge-diff-arc-agi-task__qWyXeSX']",0,"[60.228993, 907.238202, 900.320443, 152.628457, 128.028064]","[17.89496, 84.626604, 92.717227, 28.997556, 80.717204]",0.0,False,[] 
+OpenAI/gpt-oss-20B,model-extraction-relu-logits,5,"['df251c62-6bce-4c8b-9655-df615dd1a2f4', 'ab2fd17a-7de8-4a23-88ad-9f91a509c143', 'e8ab8e51-c1b7-4b15-84fd-0496f67529e2', 'c470baf0-d1a3-452d-bb8e-cb4f1941b615', '9ee6a853-0115-4891-a482-163cccd25060']","['model-extraction-relu-logits__UvxNQHp', 'model-extraction-relu-logits__SKCLsgP', 'model-extraction-relu-logits__hjmWjxv', 'model-extraction-relu-logits__rKwj5oN', 'model-extraction-relu-logits__nYPvThf']",0,"[101.382685, 224.200182, 1421.58791, 27.105275, 123.24147]","[37.760407, 128.655282, 14.321979, 13.150289, 44.507943]",0.0,False,[] +OpenAI/gpt-oss-20B,mteb-leaderboard,5,"['2d59f02d-79d7-4769-89dd-50f34083e522', '7ec961ee-caa6-48d0-92af-a669881b3746', 'a7167d17-ee02-404b-b27a-fb286dee49a6', 'ac806f83-435c-4263-a6d1-f5cde8caea93', '12e800fb-c1ee-45f8-8d7c-e5543f6ac8e1']","['mteb-leaderboard__DtsojtY', 'mteb-leaderboard__RFDrnFL', 'mteb-leaderboard__CrMBVQF', 'mteb-leaderboard__4yzzUBn', 'mteb-leaderboard__chNubzm']",0,"[97.476365, 29.463283, 337.763497, 32.60288, 4.127515]","[78.221773, 4.659153, 10.653433, 41.386155, 5.057148]",0.0,False,[] +OpenAI/gpt-oss-20B,mteb-retrieve,5,"['6c9ffc91-df45-42ea-a4e2-a148e8d02358', '6fba9039-2326-4468-8474-0e2ddad0ca61', '45fb27e2-e098-4c09-b6c6-1f1c99f0323f', '3c0c81da-1f35-4a31-9c3c-cce417ea4545', '14c1c7df-3daf-428f-a914-42f56c86f865']","['mteb-retrieve__bimhxbY', 'mteb-retrieve__8jVMQVB', 'mteb-retrieve__LBUkmBx', 'mteb-retrieve__A57Tm2D', 'mteb-retrieve__MDoNPBB']",0,"[59.895487, 171.410954, 163.02571, 576.392569, 149.596764]","[10.01986, 5.771257, 43.053541, 12.930355, 31.633151]",0.0,False,[] +OpenAI/gpt-oss-20B,nginx-request-logging,5,"['c2385ee8-b2d3-4c06-b743-d5efde999f1b', '58f64bdf-97eb-4227-91c2-31198d5cfe9d', 'c1c87db3-b5f9-47fe-9734-89478e1cbdd4', 'c1e43537-c001-4206-8bb9-50256a6101df', '67ae6ce5-6de7-4bab-92ed-eea54262aadd']","['nginx-request-logging__HwEVA78', 'nginx-request-logging__X8W6dDk', 'nginx-request-logging__h9fCjkh', 
'nginx-request-logging__5p59Pos', 'nginx-request-logging__oMiiFPL']",0,"[199.520646, 235.40418, 87.401822, 126.724406, 1036.412356]","[38.491198, 60.550964, 107.362146, 59.159701, 15.168884]",0.0,False,[] +OpenAI/gpt-oss-20B,openssl-selfsigned-cert,5,"['a5b84316-9b3f-49b5-9cd6-34cef6e02703', '90ddfb49-9480-4d32-8da1-4ef6dfb95e4b', '3875e65f-eafe-4a9f-aba6-30cab2c32547', 'd5bfd68d-bb07-4ac4-aa84-5db9e85c0885', '5083f31c-15fc-4147-99e1-0b02bd57079d']","['openssl-selfsigned-cert__Xy3WvG7', 'openssl-selfsigned-cert__y9U9dny', 'openssl-selfsigned-cert__zearvBS', 'openssl-selfsigned-cert__heUwSJj', 'openssl-selfsigned-cert__3ZjBKp6']",1,"[43.791773, 31.62658, 14.464017, 76.609029, 53.614372]","[35.893521, 27.702207, 28.072482, 17.554384, 24.201674]",0.2,False,['90ddfb49-9480-4d32-8da1-4ef6dfb95e4b'] +OpenAI/gpt-oss-20B,password-recovery,5,"['46a8f4a6-707e-46f4-b891-cbaadebe0613', '5ea83cc7-e311-4060-aa46-9fc26475888c', '92c3c4a2-3827-4778-b519-b20bd53c5d88', '96e567d9-321f-4490-a62e-22f6da435d14', '0788ec95-dbb4-476c-8844-ddaa10bbeede']","['password-recovery__KQSp5aY', 'password-recovery__2ddbTzM', 'password-recovery__a69Lb7n', 'password-recovery__H6xybYf', 'password-recovery__fPiexMY']",0,"[408.20545, 183.070605, 87.003179, 80.332563, 95.814047]","[280.509672, 25.076574, 36.284748, 35.560526, 36.526333]",0.0,False,[] +OpenAI/gpt-oss-20B,path-tracing,5,"['955dd949-ce74-4963-b2bc-68d40ea37c0e', 'd2eeb2f5-eed6-418c-8719-d0e731de67a5', 'f8c7c687-15a0-484a-b782-643a254ac90b', '03b30e27-1968-47c1-a5ab-5a79f4ed2070', '9de18010-b7ef-4297-9314-0394eff7277e']","['path-tracing__wtqd8AZ', 'path-tracing__fC3Ev2X', 'path-tracing__Jtot6sz', 'path-tracing__sVuvCLY', 'path-tracing__zj8Htia']",0,"[136.590739, 904.008497, 447.297145, 1800.565119, 1823.319191]","[66.426799, 259.244765, 7.321174, 77.610276, 37.225009]",0.0,False,[] +OpenAI/gpt-oss-20B,path-tracing-reverse,5,"['5140980b-cefa-44e9-9629-efd7676146e4', 'b5c0108f-7418-4fc4-a254-6e23d6f39a15', 
'a1b7e64c-a453-4ced-bbc3-b487f50beb48', 'c125a170-7f90-45af-92a6-9eaa937e06bd', '2627ebe4-7093-49a3-b7d8-52c1459a3272']","['path-tracing-reverse__HHUrUPH', 'path-tracing-reverse__X29mtNv', 'path-tracing-reverse__q6fLxKE', 'path-tracing-reverse__syPiJvS', 'path-tracing-reverse__bF6eXLV']",0,"[89.028523, 313.094215, 933.841408, 241.013619, 1809.183015]","[49.756084, 51.61466, 63.739715, 37.775769, 38.260554]",0.0,False,[] +OpenAI/gpt-oss-20B,polyglot-c-py,5,"['0a849189-66e1-4a06-b4a5-41812f1dd8db', 'e3611a25-15fb-4f34-a966-71e930cfbeab', '4161c192-3809-4bd8-958e-d3c8236c3d4c', '9c6e739d-7605-45bb-b01d-ee01a4df663f', 'f4bdb963-1997-4d0a-8244-17c79ab3529f']","['polyglot-c-py__CU88n9E', 'polyglot-c-py__nTiVvVT', 'polyglot-c-py__gECas2u', 'polyglot-c-py__unt5fXG', 'polyglot-c-py__TftxBXj']",0,"[26.514535, 105.069729, 156.678424, 87.36403, 169.126195]","[17.361176, 18.343838, 42.534376, 48.855061, 98.783812]",0.0,False,[] +OpenAI/gpt-oss-20B,polyglot-rust-c,5,"['00265c1a-6913-40d1-98bb-cb160f2425b3', 'c76fac31-7b71-4ebb-a593-c72fb75245d9', '09c22d0b-f237-40c9-9152-4aebe9883106', 'e8f20704-2040-40dc-bf5d-37ef477c3b60', '1abc30ff-c2e7-419d-9140-77bafb5b886b']","['polyglot-rust-c__zxdLsPw', 'polyglot-rust-c__b6nwZGo', 'polyglot-rust-c__k6YZavh', 'polyglot-rust-c__Pz4K7eP', 'polyglot-rust-c__bTrHT6p']",0,"[65.929719, 287.065675, 115.479496, 324.601154, 900.017177]","[30.553962, 110.054438, 27.873105, 367.861364, 64.049838]",0.0,False,[] +OpenAI/gpt-oss-20B,port-compressor,6,"['7b5f3c52-ed5d-4e94-bd10-04944d2fafa3', '429fe3be-ca47-4df1-a119-4a63b19cb6d5', '0f680b06-2d72-4618-998d-51a244056a70', '3e901893-2123-490c-899a-5eff7e3d63a5', '81452652-ab8e-4c87-a3c6-47fc9ab257d2', 'f4408203-2fa1-4ff7-8a1e-789b09c7e567']","['port-compressor__KvCfgxL', 'port-compressor__3EGAkpb', 'port-compressor__RCnkkUt', 'port-compressor__9jPwScY', 'port-compressor__Karjy6c', 'port-compressor__NsaMXpY']",0,"[3600.001354, 1137.426176, 324.349625, 3618.353702, 413.329541, 3600.039148]","[22.389629, 
39.354576, 14.9444, 49.5332, 13.375094, 71.120404]",0.0,False,[] +OpenAI/gpt-oss-20B,prove-plus-comm,5,"['cae9f70b-5a9d-496a-9dc0-8cd8a818b62b', '3444cf90-0da6-4132-90e3-965cc6257dda', 'ebc0531f-b318-47c4-90c7-043b67485cc8', '0fc82369-61f1-442e-bb17-a7046f9bc3c3', '6d1ad3fa-5d9c-49f6-838d-a4cb7ba0ceb4']","['prove-plus-comm__c4EfXhj', 'prove-plus-comm__r4WdnnT', 'prove-plus-comm__T4t2zTB', 'prove-plus-comm__cudSduM', 'prove-plus-comm__BWxMeGX']",0,"[81.375598, 60.608726, 128.742029, 91.306081, 176.746637]","[26.012853, 20.182458, 59.987978, 60.449329, 26.368493]",0.0,False,[] +OpenAI/gpt-oss-20B,pypi-server,5,"['6123c128-f4e2-4575-beb7-18c6d37ac3da', 'e549c06c-2316-4319-b788-471d31311f92', '84a66352-d4c9-49fd-83cd-29d0cd71a38e', 'd1c33182-4f99-4162-9ac4-2694a2e36faf', '3ce1c433-dc09-475f-91f8-1c9bf1adc942']","['pypi-server__p6T4Vfc', 'pypi-server__RX7aTUC', 'pypi-server__kQqSBqa', 'pypi-server__6ciGU46', 'pypi-server__zKrV9gz']",1,"[54.839259, 190.194728, 243.136054, 494.924042, 207.007948]","[50.679363, 35.296106, 25.899545, 71.669067, 14.454779]",0.2,False,['3ce1c433-dc09-475f-91f8-1c9bf1adc942'] +OpenAI/gpt-oss-20B,pytorch-model-cli,5,"['59204e86-ce9d-4ffd-a483-16166feb1b11', '11e2bc41-acf9-47c3-9e9b-ec758c61c529', '9b6eac77-21b8-4a70-8b9a-77657693efd6', '86585e68-632e-4ea5-8fe0-f1e7674894fc', 'd8c24f23-a54d-4ab0-9f4e-3def8991fd93']","['pytorch-model-cli__TRM8qao', 'pytorch-model-cli__UB8NS5h', 'pytorch-model-cli__cSXRk3W', 'pytorch-model-cli__LAXkPBF', 'pytorch-model-cli__WehyYhX']",0,"[231.397258, 89.057138, 125.023286, 73.313045, 27.416625]","[133.819936, 46.608223, 134.059502, 95.36866, 28.073967]",0.0,False,[] +OpenAI/gpt-oss-20B,pytorch-model-recovery,5,"['b60b1632-07b4-4154-ab1f-ce7b6b812d03', 'f03b45d5-6407-41be-a73b-a770d3f42327', 'c9def2a7-04c6-4772-aae9-c28ee2af7d05', '68cdc892-e64f-4900-a868-cd1783c29052', '77c0bb18-fe71-4d18-aa9a-c3479ad29348']","['pytorch-model-recovery__S6yq5dd', 'pytorch-model-recovery__LhqVBwT', 'pytorch-model-recovery__4t5nL49', 
'pytorch-model-recovery__kKsAdUU', 'pytorch-model-recovery__z5NdLyJ']",0,"[915.069511, 905.398722, 81.888132, 909.177927, 900.959363]","[11.692028, 51.861133, 60.582227, 46.192584, 70.210508]",0.0,False,[] +OpenAI/gpt-oss-20B,qemu-alpine-ssh,5,"['d3ff7723-523c-4868-a5e4-9b0e23e2b571', 'c753c4a6-cd09-4661-a6cd-1e888f7ddb0d', '425b45f3-b832-4134-bd51-012e72299d4b', '9bc01c59-3d10-4014-a7a3-6fb702755c5b', '183629c0-2a41-4b88-a2cb-dfd5545393f4']","['qemu-alpine-ssh__s9E4gWR', 'qemu-alpine-ssh__sSQdUPD', 'qemu-alpine-ssh__45pRFnp', 'qemu-alpine-ssh__9tKhsRd', 'qemu-alpine-ssh__i4Nsk7r']",0,"[238.233703, 102.47707, 118.064231, 61.027218, 1046.027955]","[28.170269, 4.719013, 4.329629, 7.380716, 4.172096]",0.0,False,[] +OpenAI/gpt-oss-20B,qemu-startup,5,"['761d588c-a9b6-4ce8-87ee-27c6ec8d6851', '2833003f-73f5-44b2-a86b-60481d610544', '00f79366-76ce-4807-bbae-689c2ff19ad2', 'df957d08-02e9-4bc0-acff-7610730cb2f5', '41abb8d2-14f3-4af4-9feb-6cf4305f2d4c']","['qemu-startup__Qu5as4z', 'qemu-startup__QiN8PgV', 'qemu-startup__YgJGnm9', 'qemu-startup__jeSjP2K', 'qemu-startup__Tvss3cY']",0,"[43.907312, 39.335629, 114.005648, 900.076557, 510.358335]","[13.426351, 4.682651, 3.697756, 11.73376, 32.996446]",0.0,False,[] +OpenAI/gpt-oss-20B,regex-log,5,"['afa1fbae-92d2-4a9a-9ed0-1ab236009e69', '19d933d3-b866-478f-aef3-141ad7f526bf', '9f55c0ed-f20b-4bae-91ab-a2ba8b618778', '6d63f1db-5ca1-4953-9266-8b6691cd2530', '10e99df9-b28c-4791-85ff-8f9bc2e8cef6']","['regex-log__23gxD7U', 'regex-log__MkAkPVz', 'regex-log__9M6d8br', 'regex-log__wtn4bze', 'regex-log__a6kUjKo']",0,"[48.893916, 152.851665, 66.696215, 102.965557, 73.828295]","[188.961285, 93.386924, 164.596575, 76.143045, 138.373579]",0.0,False,[] +OpenAI/gpt-oss-20B,reshard-c4-data,5,"['1db1dc95-9af0-4cf1-b72c-3eb59b9c4e7d', 'fa8cec37-d931-4136-ad63-0403853da8ae', 'e46396d6-e548-4394-ba05-cf6e21b2cd11', '1f9dd107-1318-4a1d-8898-c40995b6d292', '6f281982-0af3-430a-90be-ec525345663c']","['reshard-c4-data__rCfntyM', 
'reshard-c4-data__sLdN5Eo', 'reshard-c4-data__tpVApN9', 'reshard-c4-data__h25aXyC', 'reshard-c4-data__7E59MKg']",0,"[150.391438, 122.426137, 114.110424, 125.623363, 56.930466]","[98.397033, 20.668352, 33.623106, 44.332779, 145.349253]",0.0,False,[] +OpenAI/gpt-oss-20B,reverse-engineering,5,"['6086d3d1-d440-417d-bcb1-c9ef62fa0140', '405b8434-64b0-4a90-8aa1-3cbf32cbc04e', '83b972dd-44b6-44aa-ae23-4295aa5f1ac2', '39b89f45-4be4-4f58-976a-004c9eeb02f3', 'f253e763-f23b-435b-b7cc-00e157c14410']","['reverse-engineering__GCFxGZQ', 'reverse-engineering__dAuf4YF', 'reverse-engineering__tAAoQRU', 'reverse-engineering__VViMcmv', 'reverse-engineering__Vu62Dbi']",0,"[1801.983972, 2030.025354, 457.261349, 343.11882, 1834.78771]","[16.582914, 33.314126, 190.988206, 56.400785, 56.558444]",0.0,False,[] +OpenAI/gpt-oss-20B,run-pdp11-code,5,"['115fbaaf-0a48-4bbc-955d-c8243d8e1277', '6c2f19d7-baac-4cbe-8e8b-5c7baa11ffc3', '1fdd1600-720e-4a94-a715-c36ec8007b84', 'e22a08e7-22a6-464e-a8f3-7d687b8ec7bc', 'fad47282-aed6-492d-8fdb-729409bae839']","['run-pdp11-code__GPoAShz', 'run-pdp11-code__qiK4Hh3', 'run-pdp11-code__WSnoCtc', 'run-pdp11-code__Ee2HCaz', 'run-pdp11-code__dxGzRqq']",0,"[1041.740275, 85.666112, 279.488057, 192.493951, 1002.170458]","[20.141693, 36.315954, 131.34532, 164.851782, 21.073204]",0.0,False,[] +OpenAI/gpt-oss-20B,sanitize-git-repo,5,"['daf5cf88-434c-4e51-9abe-26786ffb8be1', '4c371ac3-14e4-44bb-8910-f84850c938da', '5bfdf8c1-a281-4c50-b4b0-74ca6e15b4e8', 'b2ad017f-adf9-4b22-b31e-2335ede5dc87', '01c10362-c52b-4818-95a7-2b72996c3baf']","['sanitize-git-repo__xFYtKgw', 'sanitize-git-repo__kSyvNDP', 'sanitize-git-repo__qTWVkBe', 'sanitize-git-repo__w3kUVei', 'sanitize-git-repo__YH8c7XH']",0,"[102.378839, 52.370822, 102.413541, 223.962708, 173.568168]","[22.62574, 73.479837, 48.488024, 54.146418, 148.721391]",0.0,False,[] +OpenAI/gpt-oss-20B,schemelike-metacircular-eval,5,"['7fb74be7-02ce-495e-937a-880c7970e775', '356654b7-3186-41b4-be12-aad910568747', 
'8409492e-3e5a-4190-bb25-d05402226df8', '05fa808b-69c8-425a-ac10-7256f8915134', '5c3856ed-d43e-454c-b357-fce6cc12e5d2']","['schemelike-metacircular-eval__YLQDdez', 'schemelike-metacircular-eval__nbWkFeg', 'schemelike-metacircular-eval__4SQXvyq', 'schemelike-metacircular-eval__QyhLLYN', 'schemelike-metacircular-eval__aFnF4Nz']",0,"[83.828158, 110.064861, 176.998226, 41.529751, 48.781332]","[40.687824, 16.450318, 38.403265, 40.319914, 50.700628]",0.0,False,[] +OpenAI/gpt-oss-20B,sparql-university,5,"['1ac0e3a1-42a1-44bd-ade4-9d833c77b6e0', 'c78ac0ac-4e2f-459b-9de1-32abcd268740', 'f61fa8a5-ab5a-41ed-a457-ca9dcc147cb5', 'c4976abe-94ca-4a31-9292-bb77ad7e7a46', 'f74ca665-6f58-40c0-a87c-3818356c870a']","['sparql-university__G8gH98A', 'sparql-university__E4o6HMu', 'sparql-university__fn83pUJ', 'sparql-university__FH52aLo', 'sparql-university__mGSyYMr']",0,"[248.53364, 335.482886, 136.629269, 153.035339, 188.446694]","[39.287555, 87.534346, 67.11031, 128.452594, 60.143055]",0.0,False,[] +OpenAI/gpt-oss-20B,sqlite-db-truncate,5,"['967d02f3-8d5f-4599-aa55-2aca50b999e0', '6ea7ae37-00e1-4459-a775-a49cbdd7fcf2', 'aa83a5bc-d5b8-40fc-8454-ee84a5f9d40c', '2050eb82-ad25-44a6-b1c7-f90f113f823d', '4e9b5541-ab60-48df-a4ad-b1ad4daa74cb']","['sqlite-db-truncate__sB6LK6D', 'sqlite-db-truncate__cQydNW7', 'sqlite-db-truncate__k8jRhdJ', 'sqlite-db-truncate__6jjBbrZ', 'sqlite-db-truncate__UxoANUC']",0,"[49.392669, 246.880051, 78.374347, 134.062386, 140.089677]","[16.807777, 47.656133, 27.70803, 15.950653, 30.297554]",0.0,False,[] +OpenAI/gpt-oss-20B,sqlite-with-gcov,5,"['898e20a2-2f30-4d3b-beb3-f855059c4a42', '64d05522-b573-4fa1-b5f3-bb3a165e6cb1', '9aef684a-e4bd-405a-9932-d4ca61213515', '91184ff6-ac6f-4fcd-9eaf-ccd93ba8e9f5', 'b5b7d2e1-563b-473f-9676-a07f469c5a01']","['sqlite-with-gcov__jdxsMWE', 'sqlite-with-gcov__imrphRP', 'sqlite-with-gcov__E7qYsnb', 'sqlite-with-gcov__9Hn9hW2', 'sqlite-with-gcov__YuWq5FV']",0,"[164.473224, 900.741708, 911.820457, 192.055478, 28.521407]","[142.791512, 
48.283721, 16.913518, 80.963453, 58.355322]",0.0,False,[] +OpenAI/gpt-oss-20B,torch-tensor-parallelism,5,"['4e265d2e-cc3c-4f7f-8686-c594eaf39f70', '0b39aa41-2fd9-41a1-811f-1d4498e0c9ee', '6ab0dc44-7332-4d0a-96f6-975bed736d10', 'df20efba-c0d8-4e72-81b5-6b1e6f4563ca', 'db6055f0-30ab-4002-96ba-2940d11a7570']","['torch-tensor-parallelism__eeXKRza', 'torch-tensor-parallelism__Z3LmSeE', 'torch-tensor-parallelism__BfjSUfQ', 'torch-tensor-parallelism__FzHeZMc', 'torch-tensor-parallelism__yxfUfAP']",0,"[113.232244, 110.700496, 72.891641, 30.224706, 37.545308]","[43.54174, 98.161873, 44.292294, 11.830021, 22.655705]",0.0,False,[] +OpenAI/gpt-oss-20B,train-fasttext,5,"['306a7098-d31a-4d50-ada2-8515ece2562f', '76f43fa6-deb4-4bd3-bc2b-239a45394e7f', '353f49dd-306d-4e36-9cd3-4f420cec1a14', '997ab650-31c3-47a2-9643-fe7eae37a508', '39a91c9f-52fa-4158-92ce-f51cdf553ba5']","['train-fasttext__qjmZ63K', 'train-fasttext__icsSUjz', 'train-fasttext__GKNgCU4', 'train-fasttext__9CsfUFt', 'train-fasttext__c79ypNs']",0,"[1764.887709, 3627.670412, 267.011545, 252.774943, 3601.535597]","[164.787591, 62.256556, 26.974231, 77.833897, 239.380392]",0.0,False,[] +OpenAI/gpt-oss-20B,tune-mjcf,5,"['012737aa-b210-4094-b666-af6d6677686b', '7e1914a3-f12e-4639-851d-a4293f6350ac', '640c25ba-22d0-477f-b1d8-a60350a9941f', '1a05eaf9-8fa0-456c-8ccc-111218efa518', '1ce0fe41-f1c7-4bc0-8d1c-94bafbc5cc44']","['tune-mjcf__mnG39Cv', 'tune-mjcf__LKtCd7P', 'tune-mjcf__2YanKWy', 'tune-mjcf__x3uVFus', 'tune-mjcf__g2XGShC']",0,"[900.050309, 901.769956, 900.031734, 129.569055, 961.024847]","[24.060426, 15.200173, 10.49118, 77.077999, 13.779303]",0.0,False,[] +OpenAI/gpt-oss-20B,video-processing,5,"['226ef884-f95c-4bcd-9819-5af4b59e1761', '78b95d47-1386-41de-97ab-202a491962bd', 'd93d4b90-685d-4b01-881c-e2fda359eaa4', 'f784c58f-84c6-4a24-ae6e-7010412fa287', '19b6f731-4d6e-4ed7-8a0d-b8dc1329b53a']","['video-processing__aUqLK3k', 'video-processing__x7mURyg', 'video-processing__T7ZXFJq', 'video-processing__MRrjCpw', 
'video-processing__VGKnZWA']",0,"[73.400203, 250.272492, 126.6624, 99.775747, 67.445497]","[87.292586, 147.1617, 54.775425, 22.236024, 81.549687]",0.0,False,[] +OpenAI/gpt-oss-20B,vulnerable-secret,5,"['c7bd6d87-71aa-4122-b265-9dfb78ebfcda', '6cd0e534-5058-4a48-876d-0c3556839d7f', '447fa237-a571-4077-875a-0e06463593ca', '17a43245-37b4-4169-b107-622faa7a3906', '59b877cd-2dcc-4c41-899a-5538c3fd291a']","['vulnerable-secret__6jmhfTb', 'vulnerable-secret__9GzD3KB', 'vulnerable-secret__kpM9sQ4', 'vulnerable-secret__v92bXNE', 'vulnerable-secret__PNiK5cj']",0,"[900.319148, 911.566206, 154.991213, 70.706258, 900.965285]","[19.790586, 14.540984, 12.746065, 7.856905, 71.62874]",0.0,False,[] +OpenAI/gpt-oss-20B,wasm-pipeline,5,"['11a0bd98-5cd2-4fa9-8e23-b581bd0f71bd', '695faf9b-b8af-430e-a571-2a7cf773aa4d', '5f137981-ac3e-404d-831c-0fefd096fc2f', '40dc62c4-302d-49ff-aaa6-027d78becd3c', 'a9a418f6-96ff-4b0c-a07f-d690c26972f9']","['wasm-pipeline__BX5PXrs', 'wasm-pipeline__kF3Yb4J', 'wasm-pipeline__hGRUbtf', 'wasm-pipeline__DC4XeRs', 'wasm-pipeline__JXgMULt']",0,"[901.233305, 154.709775, 902.181148, 922.103355, 94.347954]","[21.208094, 26.406904, 26.18439, 10.76019, 8.960508]",0.0,False,[] +OpenAI/gpt-oss-20B,winning-avg-corewars,5,"['47e67633-e960-482e-a45a-b5f5f78a8387', '48b71008-c2b6-4017-bc13-2358365793da', 'f0358f4e-e4b3-4de8-bd5b-4404898f0a95', '9fd4419d-332d-4803-ac2e-3b01bfff5a3f', 'd7b1e31f-03e9-40af-b22a-431764db7c95']","['winning-avg-corewars__peKCCqr', 'winning-avg-corewars__2UzL2GM', 'winning-avg-corewars__Vfpikze', 'winning-avg-corewars__5shy6Ln', 'winning-avg-corewars__hwH3ahf']",0,"[231.737965, 53.578473, 57.29964, 40.792568, 85.712986]","[14.395799, 7.637372, 83.356874, 4.673759, 31.72082]",0.0,False,[] +OpenAI/gpt-oss-20B,write-compressor,5,"['70cffa09-6399-42a2-9e3d-008fbd1235c2', '2185e680-7be3-45a7-b474-e30a7c0d93ed', '616ac75f-f0af-4a56-87bb-8dbe5eb21356', '6b753aee-fa73-47a3-8cdc-f5db2db353b2', 
'a1968094-28ed-479f-b65a-3053caf0afb5']","['write-compressor__FrKafnF', 'write-compressor__P9pBQgQ', 'write-compressor__HHf3JHD', 'write-compressor__GhLFZVq', 'write-compressor__Ur9cGdX']",0,"[1240.835153, 906.86461, 900.483195, 310.212859, 904.365829]","[214.884407, 26.196002, 33.03879, 31.7728, 42.543911]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,adaptive-rejection-sampler,5,"['73b85c2f-0203-4d56-a4a0-5da30bdad1fe', '5548f677-e049-4164-9c74-ae2309d1b26b', '4ad46ed6-f07e-41b7-abcc-0950a6af8b2a', 'e0092756-f974-48d3-9739-47acdd80b5ea', 'f11d05cb-fa50-4280-809c-79d3486cc1bb']","['adaptive-rejection-sampler__idA3XWe', 'adaptive-rejection-sampler__b5P4MaE', 'adaptive-rejection-sampler__6xRrGXM', 'adaptive-rejection-sampler__qgHJC49', 'adaptive-rejection-sampler__HDJABEb']",0,"[916.269919, 905.534168, 902.045639, 905.828396, 920.723752]","[38.655894, 69.904655, 67.67623, 121.368155, 230.960079]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,bn-fit-modify,5,"['d1ea99a1-4b18-497e-beff-344f90191fc7', 'f7f8a619-775b-4943-b928-b62e1f1b0a58', '6cdf559f-952b-46e7-8a4e-8980da5280da', 'd12ca302-b458-44bf-b928-6ddef204d9f8', '3afc8524-15b2-46d5-96b1-b150eafac367']","['bn-fit-modify__DALzR8U', 'bn-fit-modify__cXbxNKa', 'bn-fit-modify__fPKvs6F', 'bn-fit-modify__QpRvhwv', 'bn-fit-modify__UuGTTfC']",0,"[1137.643445, 766.836765, 1325.061114, 1332.206074, 2467.400514]","[70.235414, 198.082197, 21.467069, 60.181334, 14.912277]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,break-filter-js-from-html,5,"['6f0f7620-6e0f-40a2-8f47-e16b1ebb3a1d', 'dc624d64-5e20-4aff-ad4e-d45030dfba95', 'f8300148-1fe7-4dde-a160-426aea23a040', 'f1ce53fa-a70e-49db-9f18-837c764d047e', '6e012eb7-7a30-4e79-a408-0add1d7eb526']","['break-filter-js-from-html__853G3T4', 'break-filter-js-from-html__6H67yG4', 'break-filter-js-from-html__KXJ98A2', 'break-filter-js-from-html__5wyjhiH', 'break-filter-js-from-html__qmpisUw']",0,"[1156.883808, 1101.209751, 1220.476872, 1249.662433, 
1203.661381]","[55.62424, 58.208278, 7.479212, 220.380089, 57.754358]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-cython-ext,5,"['44ab5543-e9e8-4f62-9ee1-b33c1d394ca9', '03ba89f0-1269-4708-a57f-2b6881a16b5b', '7ceca493-3cb9-4d35-9826-794cd42dae4a', '423b3398-db3b-4d1f-82ba-98e9b3080dd3', '06feebb8-4f28-4655-be1a-680275f1ab76']","['build-cython-ext__LnmDu4o', 'build-cython-ext__V6JJBAi', 'build-cython-ext__mF8Nzy8', 'build-cython-ext__sWG5hu8', 'build-cython-ext__GbMPV3u']",0,"[900.881575, 901.228377, 900.451124, 902.134841, 903.694718]","[134.705454, 144.962884, 12.299346, 44.250184, 104.457548]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-initramfs-qemu,5,"['e4dbfd22-bd05-4a4a-9dab-3b7d77445c71', '1b7caa96-896f-488a-aff7-6be227b82c8e', '5a9a9bc2-f373-4173-aa58-215555f92725', '134c0eed-f520-408e-8d5a-6a27d59d30ba', 'a80bb35e-fba3-4f56-90d8-1d5d82ae9f20']","['build-initramfs-qemu__SWn5Siv', 'build-initramfs-qemu__SAdkWjz', 'build-initramfs-qemu__cC5czQx', 'build-initramfs-qemu__KPRNGuJ', 'build-initramfs-qemu__JVC3Ptg']",0,"[874.222941, 501.99624, 902.984272, 534.182077, 900.70822]","[42.847117, 70.97044, 74.168843, 88.660363, 25.039711]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-pmars,5,"['4d1ffb2d-ad00-48a6-869f-6f6418fa217f', '6eea71e2-c8c0-4eef-96ba-53e6ae258e4c', '45527d41-9601-46e0-b195-1fa35851a8c1', '9f08c12f-1a42-4314-976a-2168025736c3', '5fbe8bbc-cc8d-4e70-b4c3-063c931f99fa']","['build-pmars__b5Zx29E', 'build-pmars__YJY4PGb', 'build-pmars__uUgqP3Q', 'build-pmars__6f4fcGv', 'build-pmars__ncv5qkQ']",5,"[915.933456, 904.621618, 514.548414, 753.10938, 612.808052]","[10.036897, 37.246813, 3.423198, 42.630359, 3.681964]",1.0,True,"['4d1ffb2d-ad00-48a6-869f-6f6418fa217f', '6eea71e2-c8c0-4eef-96ba-53e6ae258e4c', '45527d41-9601-46e0-b195-1fa35851a8c1', '9f08c12f-1a42-4314-976a-2168025736c3', '5fbe8bbc-cc8d-4e70-b4c3-063c931f99fa']" 
+Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-pov-ray,5,"['040d3028-6b17-46a6-bdf1-818da5f3bd01', '8510a9ae-e849-4868-8491-7b69003589e4', '00a6522b-53a9-4afd-ab14-5ac298d3ed7d', '4d89ef5c-73d5-424e-8e70-5aaa54ca72be', '5c3ba37e-1a50-43fb-a46f-424b10803bc6']","['build-pov-ray__C6Fyxrj', 'build-pov-ray__YsJtzfr', 'build-pov-ray__3nKdeeo', 'build-pov-ray__zgzHQeP', 'build-pov-ray__ak4NhZ2']",1,"[1043.830663, 2985.378311, 3105.266429, 974.964822, 1993.775304]","[29.26344, 39.210149, 97.605934, 13.439236, 61.734134]",0.2,False,['040d3028-6b17-46a6-bdf1-818da5f3bd01'] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,cancel-async-tasks,5,"['13e5bc0e-39ea-4aa9-82ab-704f3e182960', 'dc75b0aa-b489-438f-b107-4bfe4a68973c', 'eebed711-648d-4af0-b7f9-96286ddd4442', '9d965db5-b38c-458b-b1a2-17df6b98bf07', '9ce94d87-efc2-4f01-8025-e6089d5857c6']","['cancel-async-tasks__TyUxzLS', 'cancel-async-tasks__fhKEdXT', 'cancel-async-tasks__MgNddxr', 'cancel-async-tasks__AfXjDof', 'cancel-async-tasks__JQsjS87']",3,"[269.034483, 900.626118, 241.723907, 900.04131, 766.124338]","[48.517199, 179.189397, 58.780498, 88.504445, 47.988499]",0.6,True,"['dc75b0aa-b489-438f-b107-4bfe4a68973c', 'eebed711-648d-4af0-b7f9-96286ddd4442', '9d965db5-b38c-458b-b1a2-17df6b98bf07']" +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,chess-best-move,5,"['aacdbe1d-b4ca-49b1-93e3-ab27e5dba1c1', 'e58e20bd-bf09-4fc1-b9a0-bba488b438f2', '08a8ff7f-b681-4427-85a6-5fc5c4ecaeb4', 'fb6af8fe-c9b4-4a19-8989-26886ce467e2', 'b36aa925-62d4-4629-a715-223f7c7283f0']","['chess-best-move__aoKG8L6', 'chess-best-move__iE2mVtM', 'chess-best-move__c3GaxnL', 'chess-best-move__8pudX3C', 'chess-best-move__nYtjdm2']",0,"[820.276921, 322.225343, 744.059469, 78.995028, 905.009129]","[25.942332, 162.32634, 66.839441, 6.815274, 29.705427]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,circuit-fibsqrt,5,"['43edcb06-f3dd-413a-8283-39e6fc5f680e', 'e55d2084-c51a-4e7f-9d8c-130f8da953dc', 'd0c97676-7b11-4025-9c0c-a294941592db', 
'fd2ea1f1-05ec-406a-ade7-8934683ce679', '499420d3-3e08-4f92-bb70-765a7187a3ad']","['circuit-fibsqrt__mRqSuQM', 'circuit-fibsqrt__tXu8wCE', 'circuit-fibsqrt__iYPgqfA', 'circuit-fibsqrt__UA8NpqE', 'circuit-fibsqrt__z6LARY7']",0,"[3615.228631, 3600.050767, 896.27068, 1050.939795, 1684.166755]","[23.324887, 27.110416, 28.300053, 16.960136, 148.10503]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,cobol-modernization,5,"['3408c973-f574-4cd5-9135-13cf8f789daa', 'a450bbf0-4497-49ad-a62e-1677a75a99b8', '66702491-3acb-429d-819d-7dc3b15ffc0e', '5ab76039-41b8-4155-b348-f32ff5c8cce2', '879ee685-4c36-49e1-b774-d2e272962dca']","['cobol-modernization__RNcM92n', 'cobol-modernization__3cW7tjz', 'cobol-modernization__o4eEiUT', 'cobol-modernization__ThNkn9W', 'cobol-modernization__p6w3nqC']",2,"[668.916419, 918.382574, 900.009431, 901.554932, 915.06147]","[52.404084, 43.681594, 47.734556, 76.51417, 52.40257]",0.4,False,"['3408c973-f574-4cd5-9135-13cf8f789daa', '5ab76039-41b8-4155-b348-f32ff5c8cce2']" +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,code-from-image,5,"['95b1447f-94af-44e4-bf0e-2d3c1e93f571', 'f36962c8-fec8-405e-bd8c-3898e34c5998', '79693a76-7347-42f5-a9d1-4e6e14e72f61', '3cd86300-4a0a-4b72-83bd-fc2d03672e15', '64c01cb1-74ce-4008-95e5-add099ff32d7']","['code-from-image__ANZoDmR', 'code-from-image__yGSfYVv', 'code-from-image__H5sVsU3', 'code-from-image__ogfLFS4', 'code-from-image__ABJkdTV']",1,"[626.83562, 1204.802094, 991.873763, 322.815884, 820.332866]","[55.935748, 101.983159, 45.557034, 20.928461, 15.873096]",0.2,False,['3cd86300-4a0a-4b72-83bd-fc2d03672e15'] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,configure-git-webserver,5,"['2bb85130-9b8f-45fb-a35d-d8f8b6c0f1de', 'd5c42548-984b-4d57-bb93-ec1e0f3ec4dd', 'f317dcb5-71ec-4ebb-b064-d37bf0ade247', 'f4a92dd1-8e89-40ea-8866-45fef756e430', '2de1ebb3-c9f1-44a3-81b1-5b374965db82']","['configure-git-webserver__ahv7fTc', 'configure-git-webserver__wdkcHP4', 'configure-git-webserver__CYJ4q7P', 
'configure-git-webserver__6mCjPiw', 'configure-git-webserver__wiSmQ2G']",3,"[627.071429, 609.395277, 900.290625, 900.518605, 668.713229]","[59.163743, 38.686079, 28.382164, 57.417791, 106.868322]",0.6,True,"['d5c42548-984b-4d57-bb93-ec1e0f3ec4dd', 'f4a92dd1-8e89-40ea-8866-45fef756e430', '2de1ebb3-c9f1-44a3-81b1-5b374965db82']" +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,constraints-scheduling,5,"['163b20ee-9fc2-45b5-8aae-a3624e1837f0', '5cb189ea-a335-41c5-aeb2-a025021a6aae', 'dc9909e3-9db6-46cf-b626-5a8a02d86427', 'b20a0562-1294-4e4d-8551-9879a2ce9aff', '865ec16e-2043-40be-ba01-02077e6f2043']","['constraints-scheduling__MP96gs4', 'constraints-scheduling__5HBKYKw', 'constraints-scheduling__guFJQDy', 'constraints-scheduling__6KdRiGm', 'constraints-scheduling__W2LCd3S']",5,"[702.942225, 391.861958, 1204.966363, 674.796837, 1129.035961]","[151.429807, 50.15613, 103.646591, 13.142175, 49.403904]",1.0,True,"['163b20ee-9fc2-45b5-8aae-a3624e1837f0', '5cb189ea-a335-41c5-aeb2-a025021a6aae', 'dc9909e3-9db6-46cf-b626-5a8a02d86427', 'b20a0562-1294-4e4d-8551-9879a2ce9aff', '865ec16e-2043-40be-ba01-02077e6f2043']" +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,count-dataset-tokens,5,"['11293f0f-1997-498c-b84a-af00a7eb8ab5', 'e3dfe3ec-e6c4-417b-8433-bfc9ab471995', 'ad96c00b-803f-4e0b-b848-aef3941a9bc2', 'ee94edce-4024-4e57-928d-1bc20d4db412', '97ea7eeb-c160-494b-a119-817c375eb442']","['count-dataset-tokens__dyVbjHh', 'count-dataset-tokens__Acq6RAo', 'count-dataset-tokens__Ert9Sxz', 'count-dataset-tokens__v8cRk8E', 'count-dataset-tokens__PWZCJHA']",0,"[740.905576, 900.323936, 906.8158, 660.523458, 932.418981]","[41.854146, 21.457513, 80.4219, 199.82492, 131.738845]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,crack-7z-hash,5,"['b24625f3-3305-496d-9200-0b7071eaf2c5', '65498ab0-8c5a-440e-b1f9-a4ce470026d6', 'a62d0bea-a605-47cd-a544-7404e67b5b71', '0e3d4498-59bb-493e-8c80-c890826a51b7', '01dc8b2d-4901-4e46-b50d-ae6b98b67060']","['crack-7z-hash__Bee2jrf', 'crack-7z-hash__aGbtYX2', 
'crack-7z-hash__LjogwKN', 'crack-7z-hash__79Q7NTV', 'crack-7z-hash__J8SnKeA']",0,"[459.921733, 265.532981, 534.435145, 910.169873, 390.560703]","[7.506736, 46.467922, 27.732666, 131.84213, 25.142638]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,db-wal-recovery,5,"['1c72e7bd-15d9-4083-8d19-238f2b806d59', 'ad1bc51a-9353-48f1-9173-b94038eed24a', '6de63371-e49b-4bf4-b955-a4adf5ac9169', 'bf5c5796-6487-42b9-884b-8f691ed9a429', 'e4290f35-5807-4061-9b47-e032191b6763']","['db-wal-recovery__vAoxu2C', 'db-wal-recovery__VKMBX3z', 'db-wal-recovery__MDbS9C5', 'db-wal-recovery__P8E6AYP', 'db-wal-recovery__utkKvHY']",0,"[902.751639, 619.78663, 940.987152, 174.403243, 547.685419]","[26.824325, 26.413669, 87.897557, 8.112085, 24.695]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,distribution-search,5,"['fe0c050a-861a-407c-88b8-b7f067233e18', '8ac69219-6e09-4cad-922d-d0a024299271', 'c7280f12-74ed-48cd-a12b-83b016181e59', 'f56fe099-e01e-4440-89a5-da255386bf42', '75d95b08-130a-4e4f-a448-07d75f0a19f6']","['distribution-search__Vb6LEJv', 'distribution-search__yxmaarY', 'distribution-search__moQBsEQ', 'distribution-search__Kgxi9ZE', 'distribution-search__X7ouTjr']",2,"[534.762051, 685.730188, 1526.148199, 317.376645, 814.595259]","[26.035476, 145.422905, 206.575705, 46.829732, 49.068585]",0.4,False,"['8ac69219-6e09-4cad-922d-d0a024299271', 'f56fe099-e01e-4440-89a5-da255386bf42']" +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,dna-assembly,5,"['5b5025f3-37f8-4a2f-8f12-2d6d0254cd8c', '2e05751a-d205-45d1-809f-f0b08d5c960f', '1faac076-907e-4c45-9e86-fd361c6067bb', 'c0a1191e-b461-4446-91cd-b6eecd3c17a7', '5d608d9c-58fa-4e6d-a287-05b3c1c97090']","['dna-assembly__dU3fevB', 'dna-assembly__Tcyjemx', 'dna-assembly__FndiAVd', 'dna-assembly__tN7mPGU', 'dna-assembly__euN6mB6']",0,"[738.789818, 756.249183, 730.336173, 748.774548, 720.210787]","[39.274943, 143.599891, 55.423753, 18.966921, 107.209481]",0.0,False,[] 
+Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,dna-insert,5,"['ea32f06a-ec71-4e67-957e-8463e4794b2d', 'd4c39c15-85d3-49f1-8f42-ee7522eaef00', '4becdaf2-ded7-4b93-b3d1-2a0197f8e31a', '808c2f0d-d7bf-4317-8288-6c2c209c3bf4', 'f8029e1d-ab53-4c8a-ac08-ea484c216b11']","['dna-insert__xg7wf8c', 'dna-insert__u9Cer2x', 'dna-insert__GXNhZWg', 'dna-insert__SC9kiTR', 'dna-insert__2N3ouXa']",0,"[395.821054, 373.498096, 374.011014, 630.574918, 302.344501]","[26.180552, 29.721959, 21.299436, 237.638034, 24.169242]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,extract-elf,5,"['f0be22db-47a1-418c-ba3b-1b00632129f8', '6d87c5d4-8d86-41e8-96ce-8eb2e6f9856e', 'f66e6d5b-d883-4258-927e-630c67613403', '646e2c95-f660-4eb3-9687-cb2a9c9d1815', 'b2dcf992-5e65-480b-83d8-c624b586164e']","['extract-elf__ZbzfDdH', 'extract-elf__Spjzd9z', 'extract-elf__g8XUKrc', 'extract-elf__8CEPuhP', 'extract-elf__y5iwD99']",3,"[365.057352, 739.631058, 598.281313, 775.699841, 651.489508]","[124.307501, 66.832781, 107.564076, 23.697628, 66.209362]",0.6,True,"['f66e6d5b-d883-4258-927e-630c67613403', '646e2c95-f660-4eb3-9687-cb2a9c9d1815', 'b2dcf992-5e65-480b-83d8-c624b586164e']" +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,feal-differential-cryptanalysis,5,"['7e5a95f3-f02b-4dc6-a83b-9409f7ed21c3', '9caadcea-65e0-46c4-a4b6-7cd8b1bca2ed', 'edfb2ef8-16b5-467d-bd17-21336d7b113d', 'b8be46a6-ad64-44e1-93a4-f530eb59e722', '8d06c0ad-9258-48c7-b0cb-ff4932f77fd9']","['feal-differential-cryptanalysis__rU3WNSE', 'feal-differential-cryptanalysis__ZbYdSBj', 'feal-differential-cryptanalysis__ubwKDkB', 'feal-differential-cryptanalysis__YZsa9rz', 'feal-differential-cryptanalysis__SaU5nKz']",0,"[1348.891886, 2458.036714, 468.020863, 1560.852697, 540.398693]","[44.868646, 184.398798, 25.913284, 147.528527, 27.633732]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,feal-linear-cryptanalysis,5,"['b7c4e7b1-a7ef-4e4a-ad61-abf3c9d88c8e', '0b1249b7-84df-4604-95c0-94a8ac7f2cad', '9a8b20b6-24d5-4e60-b57b-390e8230ab1a', 
'c0bb5b47-b93d-4695-8b2f-a9afc96ca21b', 'acc93131-ea29-4366-a99e-142fbf9e742c']","['feal-linear-cryptanalysis__xdhfJRV', 'feal-linear-cryptanalysis__AnSAtsJ', 'feal-linear-cryptanalysis__Hc8Evub', 'feal-linear-cryptanalysis__dE5Phqk', 'feal-linear-cryptanalysis__D72hWZ6']",0,"[1836.86963, 1120.093766, 1819.064592, 1801.035769, 1246.268106]","[62.9925, 226.218139, 63.890466, 24.164392, 43.935984]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,filter-js-from-html,5,"['08ebdb3a-5d6f-4a70-aa50-0146188f0cc2', 'b56252ee-d633-4bd0-9bea-ea320aa08563', 'ee79d8b8-2b25-44e9-954a-aedb7a87a556', '95c37ddd-ff69-46a6-a666-18b591f41a7c', '98b58079-0597-4906-96e4-0cb22dc47b83']","['filter-js-from-html__XKfHxVP', 'filter-js-from-html__Sq3VMwN', 'filter-js-from-html__tw68Vgy', 'filter-js-from-html__VgzPrN2', 'filter-js-from-html__mBduM9m']",0,"[900.464949, 465.860672, 562.278109, 403.638001, 761.075136]","[43.82142, 32.035343, 62.164893, 59.291879, 44.150116]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,financial-document-processor,5,"['32643ad4-56d3-45b3-9ec9-156cf2dee495', '50bc0e4a-e2a7-4c25-905e-a6e988ee22aa', '41dfa544-50cf-4458-9542-a52b6c78115b', '26fccddb-85a4-441d-b623-333763be27c9', '8959f926-02d9-4785-afbf-4d15c5a990e4']","['financial-document-processor__sseYUcM', 'financial-document-processor__umCLGQ6', 'financial-document-processor__a6u2rDp', 'financial-document-processor__UQBwvSc', 'financial-document-processor__6CK8UbY']",0,"[575.294524, 513.325155, 216.610444, 740.859158, 874.378545]","[28.301239, 104.795215, 21.287336, 209.496923, 14.031965]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,fix-code-vulnerability,5,"['b421b0f4-1d85-46bc-98c4-edacde5964b3', '9c941f45-1745-4981-9daa-7810f42a497a', '75785621-085c-42c0-8e81-a311e07ee265', '9d84a83f-581b-4b4e-a894-0a71697ebebc', 'fabc7c4d-ebe9-41ca-a53a-679445d95a55']","['fix-code-vulnerability__Xez82PF', 'fix-code-vulnerability__yDVa2iA', 'fix-code-vulnerability__zZF3bZi', 
'fix-code-vulnerability__GEzTqoC', 'fix-code-vulnerability__6buQJKd']",2,"[908.555324, 900.661841, 551.125782, 947.507452, 900.248602]","[44.352346, 13.181787, 43.178595, 5.110335, 3.370596]",0.4,False,"['b421b0f4-1d85-46bc-98c4-edacde5964b3', '75785621-085c-42c0-8e81-a311e07ee265']" +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,fix-git,5,"['566480d3-98cd-4f9b-a645-c9fb05491b44', '0acc683a-338b-457f-b9fb-a7d9f9d733a8', 'b93a28df-aa0a-443c-8e85-9196b91259a1', '63b58936-d21f-4de1-a68f-09b47b2b76e2', '2438e67f-0d78-4bea-b8a5-0e5c24eecc4d']","['fix-git__32X5PMf', 'fix-git__zea8AWS', 'fix-git__6TPScBS', 'fix-git__Cx7XzW5', 'fix-git__AoUZxhQ']",5,"[495.622287, 330.564566, 566.232465, 513.804644, 272.848379]","[22.550263, 61.45664, 39.50576, 43.37128, 19.571034]",1.0,True,"['566480d3-98cd-4f9b-a645-c9fb05491b44', '0acc683a-338b-457f-b9fb-a7d9f9d733a8', 'b93a28df-aa0a-443c-8e85-9196b91259a1', '63b58936-d21f-4de1-a68f-09b47b2b76e2', '2438e67f-0d78-4bea-b8a5-0e5c24eecc4d']" +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,fix-ocaml-gc,5,"['18da6fcd-bb39-44cb-931a-ce6c65725fc8', '7c8dc744-ee69-4a0a-bcde-b49bc6706b54', '571ec257-dd9d-4d7f-8c59-f083668a729c', '2a842935-93e1-492f-bb3e-df9771f260a5', 'bbffa713-9fbc-4c3a-9946-f8a63fc3d494']","['fix-ocaml-gc__ZY5ec7t', 'fix-ocaml-gc__jshaZ25', 'fix-ocaml-gc__bTTFp6F', 'fix-ocaml-gc__BzLNeDY', 'fix-ocaml-gc__kn9TZq9']",0,"[3613.109713, 2571.597242, 1415.570426, 3606.099714, 3627.825435]","[121.94746, 24.002008, 44.190638, 79.651779, 28.941902]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,form-filling,5,"['db61f49d-ce3e-4f96-812c-9cb20d653a42', '5f4402b0-4241-49e1-8b78-38a99fe8b5dd', '42792c29-5e49-4367-80f8-2d7a357c5537', '517a614e-0f82-4994-9e44-f556732196a1', 'ffb2182d-2971-4505-a6c5-728ca507d3b5']","['form-filling__uevabVu', 'form-filling__zVzZbQ2', 'form-filling__6jngspK', 'form-filling__vC4kZfJ', 'form-filling__bDmKRha']",4,"[900.704781, 901.912502, 478.692785, 374.51275, 433.688985]","[9.830811, 100.905627, 5.883612, 4.65423, 
10.996511]",0.8,True,"['5f4402b0-4241-49e1-8b78-38a99fe8b5dd', '42792c29-5e49-4367-80f8-2d7a357c5537', '517a614e-0f82-4994-9e44-f556732196a1', 'ffb2182d-2971-4505-a6c5-728ca507d3b5']" +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,git-leak-recovery,5,"['df7d3bd4-68d9-41ad-9134-6f7bee6839b6', 'c38990ca-d8d7-4995-9f45-0d9a0cc2a2e6', 'b8c14b87-b5b9-4737-9d9b-35fa732fd621', '4942d5c3-b892-4a38-a37b-8b5db6d04d8b', '6ac99586-2b2a-4998-aa9a-efb2375a54ce']","['git-leak-recovery__ATDJDuW', 'git-leak-recovery__ufueNfj', 'git-leak-recovery__qWWP6bw', 'git-leak-recovery__uUC7Bqa', 'git-leak-recovery__th2TW8T']",5,"[153.461073, 173.514018, 411.623186, 347.120535, 290.474758]","[52.837427, 177.95356, 76.742734, 70.48207, 87.53419]",1.0,True,"['df7d3bd4-68d9-41ad-9134-6f7bee6839b6', 'c38990ca-d8d7-4995-9f45-0d9a0cc2a2e6', 'b8c14b87-b5b9-4737-9d9b-35fa732fd621', '4942d5c3-b892-4a38-a37b-8b5db6d04d8b', '6ac99586-2b2a-4998-aa9a-efb2375a54ce']" +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,gpt2-codegolf,5,"['54a3a571-d2c5-4f78-8d03-2be7406f44e2', '5fdadff7-69a0-4d1d-b65e-3c40ff714fef', '9c1fbb70-5c2d-401b-bc44-a2b25e744687', '45b52d22-2f0f-4e1f-8049-351aa0cf95e2', '55cda5ed-9883-4b5c-8579-f555e695fe89']","['gpt2-codegolf__pAfWLKV', 'gpt2-codegolf__YbFLdzV', 'gpt2-codegolf__Mp87UHT', 'gpt2-codegolf__GsJ3ron', 'gpt2-codegolf__qb9oN9L']",0,"[910.802121, 499.48679, 384.661556, 276.500254, 904.096074]","[166.905545, 135.563991, 19.225045, 317.869845, 24.312536]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,hf-model-inference,5,"['c8b937df-3356-45ee-8b8a-53b464d80dd6', '0c0f13f4-ec56-40ca-bbcb-20b0cc7c6bc9', '9567cfd5-d7bf-489d-a188-251650d35caf', '6423921b-b1f5-43f0-a5d2-1f12b805a9dd', 'fd92f0a3-1a06-4d73-9dac-df1cbc970f50']","['hf-model-inference__Axy83aX', 'hf-model-inference__EjBa3Ki', 'hf-model-inference__ypfYggS', 'hf-model-inference__5j6Xckn', 'hf-model-inference__pDFXZiT']",0,"[573.637162, 925.986945, 342.102901, 334.198409, 582.349791]","[66.765994, 36.699767, 93.914018, 37.798128, 
52.175726]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,install-klee-minimal,5,"['88844d79-705c-4a91-b046-d139020d8ace', '2763ed6f-98bd-4067-86ed-61529e1be632', '8aa6f73e-cd5f-4a4e-9803-79b853d93acd', '4f2f0d63-d419-432b-9d84-44b199b2f309', 'bee9440b-9253-4d69-8da7-b2d6ae9d6cc1']","['install-klee-minimal__DgkVrTu', 'install-klee-minimal__9VhcoRT', 'install-klee-minimal__rsQbtH7', 'install-klee-minimal__zVRC5q8', 'install-klee-minimal__KarrLB6']",0,"[900.02768, 900.000675, 1751.069716, 900.468381, 900.066762]","[29.252047, 91.247588, 128.612579, 65.755801, 89.571414]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,install-windows-3.11,5,"['ba2b9534-3641-4305-b940-d2ac1e7b3bd7', '8d2939e5-cb1f-4ee9-a00d-1e5dd56d39f1', '0aff3637-463e-403b-80cd-fb97af8c5493', '84c14f0a-0fca-4aa7-a9f1-ecf6f639be12', '51f929c3-0647-4c4d-b3b4-b301cc62a0b1']","['install-windows-3.11__GvMuarB', 'install-windows-3.11__vhSe3Gt', 'install-windows-3.11__tWyqHfw', 'install-windows-3.11__uthEgaD', 'install-windows-3.11__QH75tVm']",0,"[237.833925, 1203.25457, 1484.71183, 763.00718, 919.509702]","[24.550542, 117.392243, 45.416437, 63.489317, 62.968371]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,large-scale-text-editing,5,"['68198567-c72b-4ae6-8ce0-1fbf5a6ac135', '4b289235-81f9-4b0b-8d19-6da18dbb94df', '2dd96148-0cb9-443c-9ec0-98f42ab69b82', '7b30fbc4-b009-40cd-8b17-bad7ff090b74', 'd53e6d3c-524c-4dd4-9b99-8f433c6dc90b']","['large-scale-text-editing__h8xPsGZ', 'large-scale-text-editing__3z7EF7v', 'large-scale-text-editing__ZpGuKEf', 'large-scale-text-editing__zfuRZZ6', 'large-scale-text-editing__aucXXeo']",0,"[1211.410911, 497.648655, 708.316535, 1244.966098, 1200.509594]","[44.617962, 285.429827, 198.587364, 19.466645, 81.477909]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,largest-eigenval,5,"['bbfbdd21-7111-4e3c-b5dd-14c472fb6825', '10d932ef-09b3-448a-9137-c0d41d9768f0', 'e6161e63-53b9-41ee-872e-8441a6aa0f60', '60ee6912-7542-4d9b-b1e8-d290c6cfbb1b', 
'0c744cfe-aed4-4812-81b3-9f00ffdae064']","['largest-eigenval__M2NVA9e', 'largest-eigenval__qW4xJXD', 'largest-eigenval__mgvEgB7', 'largest-eigenval__VuAcyPq', 'largest-eigenval__5pHtWn3']",1,"[553.179561, 907.779643, 913.102286, 611.290803, 905.013828]","[26.379303, 352.4378, 110.863499, 42.710756, 132.159705]",0.2,False,['60ee6912-7542-4d9b-b1e8-d290c6cfbb1b'] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,log-summary-date-ranges,5,"['365dcd78-ce12-44a0-8d2b-99d43db43394', '2c356500-e109-47d1-8d8c-73db20b46c7f', 'a92e3751-ad7e-4a1a-8155-801e3208f1e0', '85bf8056-de9d-492c-af2a-de8efa81b2ea', 'edca92f3-d1d0-4226-ae43-4a3982e6e439']","['log-summary-date-ranges__iNfJdKY', 'log-summary-date-ranges__Suzpbyb', 'log-summary-date-ranges__JigRmPW', 'log-summary-date-ranges__AQXmZaF', 'log-summary-date-ranges__8YEgkTx']",4,"[393.691667, 190.140815, 200.016045, 338.196541, 290.677938]","[164.459261, 64.016464, 17.611356, 97.951553, 35.275292]",0.8,True,"['365dcd78-ce12-44a0-8d2b-99d43db43394', 'a92e3751-ad7e-4a1a-8155-801e3208f1e0', '85bf8056-de9d-492c-af2a-de8efa81b2ea', 'edca92f3-d1d0-4226-ae43-4a3982e6e439']" +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,make-doom-for-mips,5,"['ee769c80-10c2-4044-b47f-7dba3b045a17', '41ada0fb-49c6-4f19-aa0f-114e211b4bab', 'e87a402f-bf18-4b9c-96b8-3bf64a5f936d', 'f27753f4-b287-42e6-b84c-120f526d18d5', '493edcad-28c1-4f3c-b613-13748ee6b73f']","['make-doom-for-mips__zxruU46', 'make-doom-for-mips__cBiwkjX', 'make-doom-for-mips__MQEWfSm', 'make-doom-for-mips__vbhPoAs', 'make-doom-for-mips__AgT78aY']",0,"[919.006607, 901.00345, 908.157591, 921.348261, 900.025507]","[129.880884, 14.664119, 31.36829, 33.822388, 293.52921]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,make-mips-interpreter,5,"['5d676335-bede-4a46-940f-6577e9de7bf2', '65c38f1b-d693-453f-8006-8aeae9639884', '2922d35d-5727-44ed-85b6-9d7f1833b8b5', 'dddf66b4-b8fa-4885-a243-af8664b6dba6', 'a1828aca-94e3-4360-ab4f-fa4197ce1938']","['make-mips-interpreter__oCxwDTk', 
'make-mips-interpreter__p2mxjZt', 'make-mips-interpreter__obF6mrs', 'make-mips-interpreter__ziuYT4G', 'make-mips-interpreter__vBkqLZ2']",0,"[1518.34756, 1800.226092, 4841.018785, 1350.749868, 1807.904752]","[44.614527, 48.679714, 10.959065, 126.306055, 71.607087]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,merge-diff-arc-agi-task,5,"['bd34762d-78dd-4358-a303-dfa71baa2f75', '47c4d818-7cca-4860-bc47-03c7f590d6b5', '19c5e3de-69c6-483c-ae52-714e6a95b1b6', '291d4605-6f73-42e3-b62c-245b63536a2e', '4ce53677-4b76-4d33-a901-034a0562418f']","['merge-diff-arc-agi-task__HSmQ9JG', 'merge-diff-arc-agi-task__VVnYtS6', 'merge-diff-arc-agi-task__tWHVcVg', 'merge-diff-arc-agi-task__BFLVvkt', 'merge-diff-arc-agi-task__nNbstZq']",2,"[277.19801, 912.495621, 725.307267, 926.567994, 388.994456]","[22.115007, 67.837854, 32.832069, 111.045407, 77.725364]",0.4,False,"['bd34762d-78dd-4358-a303-dfa71baa2f75', '4ce53677-4b76-4d33-a901-034a0562418f']" +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,model-extraction-relu-logits,5,"['53f8669f-7fe2-4244-af21-4aafe08a6e0a', '13b2b7d7-4c63-47a0-b38f-8f95e3b370ab', '3f11f238-54d4-4ac8-8582-51ede6a41a70', '49e34070-2538-4290-b4f8-e0d41b4cf5bf', 'b0f55a03-e631-47a9-b558-62a7d7b55c2a']","['model-extraction-relu-logits__zaxCka4', 'model-extraction-relu-logits__oEZCH9r', 'model-extraction-relu-logits__3aMdXuY', 'model-extraction-relu-logits__jp2iLsW', 'model-extraction-relu-logits__dSzSadA']",0,"[816.844789, 827.348843, 912.443051, 1150.099171, 498.651982]","[23.362053, 174.148277, 101.192577, 49.851901, 22.22118]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,mteb-leaderboard,5,"['47c2bdfe-3e1f-48c2-af26-3dcf61216345', '8105feba-7a00-46f8-84fa-bc7d9428e84e', '18dcde71-014b-4085-95fe-54390c344185', '70791c6c-9952-497b-a547-c92af3f188d8', '8c08453a-ae7c-47fe-bfd1-5a2282d00205']","['mteb-leaderboard__TVNwtnw', 'mteb-leaderboard__AL6ztAM', 'mteb-leaderboard__boQ4R4S', 'mteb-leaderboard__eYc7PvM', 'mteb-leaderboard__nLogM4R']",0,"[255.135219, 
214.026758, 1869.325197, 509.635021, 468.001021]","[4.917682, 21.412262, 10.624288, 32.016028, 5.337509]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,mteb-retrieve,5,"['441619e3-540b-4963-acb5-80288d17c72c', '14542b18-5878-4215-a87f-575e8b0d57e3', 'aaac5bd2-2d9a-48ae-b23a-2f7db5e77c15', '0e5c2e18-c22e-49ce-8da9-b452f91ab55e', '56cc63ee-de99-477c-99ef-545b42f6be54']","['mteb-retrieve__DDJKywm', 'mteb-retrieve__S5XvJGT', 'mteb-retrieve__3BCXzz8', 'mteb-retrieve__bW2Kwyp', 'mteb-retrieve__3sjYUwS']",0,"[230.947369, 326.776511, 214.508221, 189.050685, 118.603113]","[7.721069, 12.776312, 4.434374, 4.291891, 113.386389]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,nginx-request-logging,5,"['689b6712-a73d-42e5-8dfb-45303790a1dd', '7544d79b-faf8-4792-b142-3881601ce82f', '867b8355-51c6-448c-ab85-dd6c5f60f3c9', 'fd0b345a-0e8a-4382-8f39-5335d3c6cf32', 'dcd9bf4c-f222-4839-9c74-b8bf09bb1c73']","['nginx-request-logging__PYQmiKY', 'nginx-request-logging__g8mcdh4', 'nginx-request-logging__bWTWrEG', 'nginx-request-logging__oy2MEeZ', 'nginx-request-logging__TRBuX4i']",2,"[1028.651128, 900.532029, 559.022787, 664.485247, 819.207408]","[19.325006, 16.937329, 164.258055, 31.671776, 102.591371]",0.4,False,"['7544d79b-faf8-4792-b142-3881601ce82f', 'fd0b345a-0e8a-4382-8f39-5335d3c6cf32']" +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,openssl-selfsigned-cert,5,"['dad2e1e9-306e-4c4f-b05c-93f924c4992b', 'ff0f19ea-58f9-40d2-8a69-eb756626c9ed', '71c3752a-1ee1-4939-a0aa-0ecce60cf68a', 'c6777baf-6c7c-46b2-adf0-0fbd828de527', '89e1f170-07d3-43c8-9b18-f8a4eb41c9d4']","['openssl-selfsigned-cert__qRbnxah', 'openssl-selfsigned-cert__397APdB', 'openssl-selfsigned-cert__tr7Bb7R', 'openssl-selfsigned-cert__F2WYNRC', 'openssl-selfsigned-cert__9fHqcTg']",2,"[715.499315, 181.191757, 169.391154, 415.117961, 166.120489]","[60.580249, 17.555905, 28.385653, 25.749919, 30.022484]",0.4,False,"['71c3752a-1ee1-4939-a0aa-0ecce60cf68a', '89e1f170-07d3-43c8-9b18-f8a4eb41c9d4']" 
+Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,password-recovery,5,"['b0174e4f-1dbc-4e8d-92a7-1ea442ffc51e', 'd7ad3f3c-4088-4f8b-b5dc-6f031e954c42', '12c0dcf6-c511-46a3-b3a8-5426c50b5e9a', '0167e4f1-558a-499f-b095-933391437034', '3c1113be-ffdc-4de1-a295-0795935b2ff4']","['password-recovery__bMNi2Yv', 'password-recovery__qxdpUAu', 'password-recovery__4yPuVk9', 'password-recovery__6VVdwv4', 'password-recovery__e45uXyh']",1,"[1551.820187, 924.365593, 904.441979, 910.24323, 796.656521]","[115.389726, 38.406723, 24.921196, 32.803429, 32.386428]",0.2,False,['3c1113be-ffdc-4de1-a295-0795935b2ff4'] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,path-tracing,5,"['7500d5de-a64f-4104-a6e6-002c45ce48b3', 'da84d717-2fc7-4902-99a5-70ebcdc7056a', '2801141f-7806-407c-8253-5288388fda09', '58cd1a5b-7c80-490f-a5ac-7810ca708f1b', '84c0a330-2689-4f7f-9b06-914d3f358b4e']","['path-tracing__ZZuV2ZC', 'path-tracing__Ff3pNp4', 'path-tracing__CPaqBRP', 'path-tracing__CnFR6p6', 'path-tracing__UPATGr7']",0,"[1805.165513, 320.513078, 1119.455138, 1154.238242, 620.858057]","[76.456264, 21.026877, 50.820294, 93.535552, 7.023899]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,path-tracing-reverse,5,"['2c36bc67-529e-4625-8780-881b2996ac0b', 'da870387-d393-45d9-a4d9-aae3f8e0b20f', '306f1740-3fca-41cc-a41c-61a286cbdbbd', 'e4bcdc8f-fc92-4aa9-b6fc-23f4e4f6c565', 'd17f5380-55a8-4cbf-a809-50e5f84e4d85']","['path-tracing-reverse__nqXqqMV', 'path-tracing-reverse__cxdmHMg', 'path-tracing-reverse__32AsR8b', 'path-tracing-reverse__SS48bDT', 'path-tracing-reverse__DadwiTZ']",0,"[1077.740802, 1011.309079, 1824.024906, 1840.649835, 1475.115557]","[38.439968, 82.257527, 50.576286, 52.722128, 18.749882]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,polyglot-c-py,5,"['96138730-f61a-4694-90c5-cff3013f4fa4', '53384d0b-c0fe-455d-aec6-0dccdcf3516b', '94437be0-6127-4e60-9d04-0ab1ce858c18', '86039e9d-c8a4-4d01-b5a0-09f5cb93f03a', '42506c05-0b8f-44c5-bdf9-471d096039eb']","['polyglot-c-py__2vhxHft', 
'polyglot-c-py__BLxpfFd', 'polyglot-c-py__S4R3uAR', 'polyglot-c-py__JFsgM7E', 'polyglot-c-py__7yG2LHs']",0,"[645.758931, 276.795469, 900.017569, 910.368116, 900.021209]","[98.922845, 42.044261, 39.204978, 29.459725, 18.664754]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,polyglot-rust-c,5,"['f103b773-8968-4255-8010-51bd4d12d885', 'ad923874-ba26-47b4-910b-65c45878a365', '1a00b578-0289-44b6-ac5c-159e90734e2d', '2aba641d-7392-4150-a147-6d3889b8ffed', 'a28b88cf-dd7c-48b8-8cb9-303aa3ede905']","['polyglot-rust-c__zULG5rb', 'polyglot-rust-c__U5urFN7', 'polyglot-rust-c__hqEhYTK', 'polyglot-rust-c__ESUKMPX', 'polyglot-rust-c__VR9mNbz']",0,"[934.293, 903.469799, 913.178116, 900.098759, 969.394023]","[101.045948, 162.991682, 124.60954, 276.624563, 57.660151]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,port-compressor,8,"['28a9158a-9005-4996-a870-e363a30af346', '51c3aa97-9c56-4bef-8fe4-1fa6065b2e7b', 'b59b9cb4-f824-4081-b887-928ae94f3714', '4befc5da-a436-472a-abb8-ad979455e306', 'd79fa122-ecd8-46d8-993a-066b8fe48c5d', 'ef762438-6043-4a42-a45a-b9b481840ac6', '8db551d9-2c26-4240-9690-62caf946da55', 'b9eccab8-ff11-4122-a4ab-f070a092cd75']","['port-compressor__Jo7KfnL', 'port-compressor__YWcxq44', 'port-compressor__zQpnDE9', 'port-compressor__VQVza72', 'port-compressor__YFCSXNj', 'port-compressor__dGrWYKD', 'port-compressor__LdZXC3q', 'port-compressor__qwxFuso']",0,"[3606.503901, 3600.001236, 3023.158004, 3600.001221, 3600.012846, 3600.471402, 3631.215361, 3620.130999]","[163.261978, 8.99425, 32.758919, 11.584992, 15.49711, 70.891101, 56.872722, 94.278499]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,prove-plus-comm,5,"['4950fe5c-3af4-45d7-a081-14d6a0e07d4c', 'c19d4e24-023a-4add-b057-7000c90bb0a6', '9c2fe063-782e-40e1-ae1d-b58d66d2c509', 'dc2307f9-bb45-42a0-a9d9-98cb6da01938', '36736c49-f973-4f04-a4d6-0f70f8b434da']","['prove-plus-comm__WmhHmvT', 'prove-plus-comm__XB3QU5C', 'prove-plus-comm__UUpejzd', 'prove-plus-comm__KoyHKGT', 
'prove-plus-comm__33ztmP4']",1,"[918.028176, 171.709209, 900.492358, 913.233448, 421.592904]","[71.236606, 60.574584, 99.077601, 26.460775, 21.154305]",0.2,False,['c19d4e24-023a-4add-b057-7000c90bb0a6'] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,pypi-server,5,"['6ef22d23-a879-40d3-8a98-ed05816976ae', '1da65ffb-e7a9-4ee8-8839-871df824e61a', '3f78b1e8-cb9d-4af8-b2c7-e903385708df', 'b8db9335-78b1-4bed-b311-101d54fe3041', 'ce1ba356-19d9-43bb-bae1-220cb6d8d8bc']","['pypi-server__dZHdpoV', 'pypi-server__ystWeVP', 'pypi-server__RmzS3Xo', 'pypi-server__wc6PPvt', 'pypi-server__5m4huNZ']",0,"[713.294589, 540.424395, 916.468089, 900.033032, 905.443565]","[36.301268, 50.303853, 58.175051, 15.279564, 53.300196]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,pytorch-model-cli,5,"['f24f41b4-cc98-4e13-8806-ece358093e32', '3e0b43ee-d1db-4a8c-9ac2-e4e15da730cb', 'f11df8b3-737e-4ccf-b4a5-ef18c483681e', '2d83485b-af72-448b-8644-258d388ba039', '110ceb01-9bb6-4ee9-a536-3befcdc6dfaf']","['pytorch-model-cli__cRBziR8', 'pytorch-model-cli__5yCH79o', 'pytorch-model-cli__ySAdAYw', 'pytorch-model-cli__jwwbFtv', 'pytorch-model-cli__DQ9eXhH']",0,"[817.143022, 900.338713, 494.687185, 627.12886, 519.175958]","[61.250292, 68.738528, 17.918739, 134.879992, 28.378745]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,pytorch-model-recovery,5,"['e6572517-37bf-41b4-b946-125ef1b835fa', 'a16a7f97-95db-440a-a0fa-8c634070f020', '07929289-c988-4c7d-bed9-2e2cb0248511', '4fd8980d-e426-4a44-9874-36ec457c15f8', 'd7e18913-fb5c-49a4-a3ed-6633139ee79b']","['pytorch-model-recovery__d8ZtC6x', 'pytorch-model-recovery__uRvzBRn', 'pytorch-model-recovery__yJeJF6G', 'pytorch-model-recovery__h5JF2Re', 'pytorch-model-recovery__TRAGoM9']",4,"[900.633301, 903.378763, 751.309458, 430.819549, 902.05764]","[30.883103, 53.457161, 43.390339, 11.826565, 70.020075]",0.8,True,"['e6572517-37bf-41b4-b946-125ef1b835fa', 'a16a7f97-95db-440a-a0fa-8c634070f020', '07929289-c988-4c7d-bed9-2e2cb0248511', 
'4fd8980d-e426-4a44-9874-36ec457c15f8']" +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,qemu-alpine-ssh,5,"['d4b87041-cda1-4319-8c0c-2e2d61f42e52', '3b091743-9d58-4880-a98a-afdf2fd0a4ed', 'd7af7174-d4be-4866-9e6e-959bfaedf1b8', '4c591c36-a783-4cac-bec6-27deca072d9f', '83308219-5470-4a16-9a38-37fa964effc5']","['qemu-alpine-ssh__6oGjx8V', 'qemu-alpine-ssh__RmHdqfp', 'qemu-alpine-ssh__4Pqh47E', 'qemu-alpine-ssh__ekHA5X3', 'qemu-alpine-ssh__BibBxZa']",1,"[950.905527, 904.12361, 916.920913, 1042.147924, 933.500665]","[9.837422, 28.21325, 4.473999, 9.646792, 13.799776]",0.2,False,['d4b87041-cda1-4319-8c0c-2e2d61f42e52'] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,qemu-startup,5,"['ffd4ac71-08c4-4de3-9c7d-359959bca4eb', '36de5c8a-60aa-4341-9049-1fdc98684b9d', 'c5404025-c58d-40ba-a1d2-074dd8cec48e', '120412fd-90b8-40e2-99cf-4ee0a21cec29', 'f7dffa74-2af0-4d70-8602-531047175d88']","['qemu-startup__RSBF3NR', 'qemu-startup__tTgZb4H', 'qemu-startup__65sxhCf', 'qemu-startup__mN3Y4qV', 'qemu-startup__wnvYtmn']",0,"[484.467271, 985.877287, 423.513362, 328.085657, 903.169268]","[14.724536, 33.329235, 17.928102, 36.163478, 3.132949]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,regex-log,5,"['9679a48a-c639-4284-b212-2b0f33001376', 'e528c6d2-364a-4733-9e8b-45df229c6e62', 'e2502451-d4ef-4f33-9466-cd239cc9208a', '39f86d6b-ac6e-485f-ab7c-d5a2198be334', '4ea25959-ffb9-4bd7-881e-b9fdf873a331']","['regex-log__yX9Fspk', 'regex-log__GpATmgg', 'regex-log__AHigQKG', 'regex-log__TZTXVEn', 'regex-log__bY52NPt']",1,"[837.614507, 595.950667, 283.320473, 169.47116, 253.577828]","[122.608796, 188.96036, 80.887695, 132.992643, 111.94208]",0.2,False,['9679a48a-c639-4284-b212-2b0f33001376'] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,reshard-c4-data,5,"['61674130-ed1a-4ff1-81a9-250181621a7b', 'b5d051e6-2e82-45ab-8b36-3cec87526505', '987274e9-3af2-4985-a9ab-caed1fafbf2f', 'caec024e-5e88-4670-a6b6-5ba5cfcfa517', '0629b802-6f0c-4fbe-850d-5ddd8edda6f9']","['reshard-c4-data__UEBmp2w', 
'reshard-c4-data__jymFLDZ', 'reshard-c4-data__EQNzYez', 'reshard-c4-data__NXpLXQ2', 'reshard-c4-data__VbYun4C']",0,"[2067.149465, 900.415971, 902.722468, 901.364213, 920.520015]","[22.45284, 18.812733, 107.143788, 62.864361, 109.016309]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,reverse-engineering,5,"['bb68e8e4-4743-44f6-8942-6991e1ff517c', 'a5e4f0bd-a43f-4ae8-85fe-0ef66ea804db', '5f1db1e7-b797-47b4-af5f-b544d065ca23', '8f2413db-2f65-4407-a2db-9778a2a2abe5', '3f5a6d24-6e1d-4bfa-9ebf-56952f550972']","['reverse-engineering__rkfcw9B', 'reverse-engineering__PGaK4hr', 'reverse-engineering__q4WCkTF', 'reverse-engineering__MSCf7XG', 'reverse-engineering__6ES3vfR']",0,"[1801.072754, 1800.046909, 2578.574091, 1807.866536, 1804.727068]","[21.867555, 67.512781, 38.277869, 7.275086, 35.536231]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,run-pdp11-code,5,"['6ec28ab7-d65a-46e3-9029-5aefe40b8c44', '45b2f304-ae64-45a4-8558-4e70379cd240', '2f141cf1-85a6-4582-a4cf-1b8d7e98a967', 'a8a4cbe5-c513-4402-8427-f59e35c9f280', 'e1ad5434-ef3e-4d1b-a619-2a1b1b7a347f']","['run-pdp11-code__MFPPEEU', 'run-pdp11-code__fTbuWve', 'run-pdp11-code__BLHUqJ2', 'run-pdp11-code__cgQiKuC', 'run-pdp11-code__Q2HuXha']",0,"[1016.778645, 1002.416079, 1064.575988, 557.633957, 1037.034821]","[115.384091, 36.417422, 304.950596, 24.703851, 40.615138]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sanitize-git-repo,5,"['841cb7ef-442e-440b-971d-2ceb424ef6fa', 'c4d34cee-3c07-42c1-a333-aa5b92c0b7a9', 'fa6a4c84-53ba-4db3-9a2b-93f90c51c384', '865a1dbd-87b9-4299-960b-266a47f8fccd', '8562de32-7234-4140-bd24-bd6d836e7ab2']","['sanitize-git-repo__rg5kSdv', 'sanitize-git-repo__XZMBLWY', 'sanitize-git-repo__jRGugtw', 'sanitize-git-repo__swjxNeM', 'sanitize-git-repo__gEMwWgc']",0,"[338.235869, 566.58534, 685.862373, 368.31449, 924.262306]","[12.867351, 29.061723, 41.638324, 27.831983, 72.027955]",0.0,False,[] 
+Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,schemelike-metacircular-eval,5,"['fe1ac5d2-7cbe-4703-8fd2-c437d053b0b9', 'f3d5209f-75c1-469d-a2f2-394a1e52c804', '8b9d43ac-8bcb-44b7-afc7-0c0e222215f7', '6fa06099-a8bd-4ff8-b824-16b2daa5eea2', '19b899fb-4901-4c1b-99f3-298517133102']","['schemelike-metacircular-eval__uRbvtK5', 'schemelike-metacircular-eval__ZC69a62', 'schemelike-metacircular-eval__yxhQTnq', 'schemelike-metacircular-eval__RE5GBi8', 'schemelike-metacircular-eval__fFVCULy']",0,"[1588.052894, 2406.472815, 1993.440478, 1705.2129, 521.083524]","[45.660359, 27.029698, 62.42163, 97.769285, 42.521746]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sparql-university,5,"['61c6711c-c079-4f82-8c38-a34fb167d390', '0443b97d-fb79-40d8-8221-e8fb98f8b037', '96af64fe-5703-4aa1-8d21-eaed8b288382', '8a684b88-63bb-4b0a-b5b4-0ef90a464515', '5e091d0c-f174-4d2e-8459-f389aa1e56a8']","['sparql-university__tmLuyKu', 'sparql-university__LUfVjui', 'sparql-university__Qw8BbXY', 'sparql-university__z6SphQN', 'sparql-university__QsWHwWw']",0,"[242.737937, 197.593441, 345.050973, 330.063359, 740.661314]","[26.648831, 36.100445, 28.034718, 47.434951, 88.462879]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sqlite-db-truncate,5,"['b14da1d4-649f-4ba6-a2b1-72aaeb523af0', '32847b81-c54f-40ef-aea3-69e7c59819a2', 'bf255481-ad29-4dd8-8c91-b83637ecd598', 'c11658db-3f80-4a84-afb6-562cf84011da', 'd985b6b2-99b4-436b-9282-e633c1439311']","['sqlite-db-truncate__5UwQxQH', 'sqlite-db-truncate__zbdhU7u', 'sqlite-db-truncate__kWAaC8R', 'sqlite-db-truncate__YgBXMtc', 'sqlite-db-truncate__RAycvxZ']",0,"[459.544682, 102.045474, 909.242928, 267.649291, 912.580101]","[13.888787, 13.518836, 119.810266, 55.359395, 51.195039]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sqlite-with-gcov,5,"['97fbbc39-736d-4f5c-9f68-baf75a97efd1', '0b00c9f8-4f8a-4583-bdde-4b1ad6d8e374', 'ef1dfe3a-22d5-4aa2-9d81-f53220c3591f', '803364a1-8a6d-405a-b9c5-09b8adb8bcce', 
'04c418bf-6408-49af-8cb0-063ba47cac4f']","['sqlite-with-gcov__n5tHLe8', 'sqlite-with-gcov__yUXakDm', 'sqlite-with-gcov__jLvt65X', 'sqlite-with-gcov__KazT9kz', 'sqlite-with-gcov__zi4LBgG']",3,"[528.388895, 573.841481, 281.09867, 464.546568, 536.338517]","[60.989955, 129.459355, 36.357548, 60.452216, 50.832145]",0.6,True,"['97fbbc39-736d-4f5c-9f68-baf75a97efd1', '0b00c9f8-4f8a-4583-bdde-4b1ad6d8e374', '04c418bf-6408-49af-8cb0-063ba47cac4f']" +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,torch-tensor-parallelism,5,"['51b82477-b3b9-4992-8b98-e28c1600dc68', '29f04105-1318-4344-a102-34391b76d4e1', 'f3d56195-48ad-4244-8618-3389b534b8c0', '856688c1-a118-4a91-87f9-6d6ceec6479f', '94289b2a-8326-4d30-a761-a6322b7c715d']","['torch-tensor-parallelism__zfaJQX6', 'torch-tensor-parallelism__QFsAopU', 'torch-tensor-parallelism__Qo9mfdJ', 'torch-tensor-parallelism__3AAGAko', 'torch-tensor-parallelism__6BLwi8D']",0,"[294.167971, 94.44862, 915.468369, 171.888906, 246.88208]","[49.093982, 28.279927, 52.620394, 36.92883, 14.466311]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,train-fasttext,5,"['3047ae54-efed-4b96-8549-4751dffdb665', 'e6fc1e44-e6f2-4a78-97b1-39d4d7c8f08f', 'cb0a58be-813e-4e99-b67a-5b033eeeeceb', '53ef0924-cdc3-428e-803a-61a001840766', '8c00bb8f-5bfd-4ff7-8c0c-966207be7589']","['train-fasttext__SULzXPZ', 'train-fasttext__QwLe63X', 'train-fasttext__qMC7uKi', 'train-fasttext__QHJj6Bv', 'train-fasttext__BfHxoeu']",0,"[3600.005859, 3600.005803, 3384.744772, 2193.987261, 2789.764409]","[121.376611, 46.10825, 22.724076, 29.065385, 61.461353]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,tune-mjcf,5,"['82b5839d-886d-40b5-a852-1653cdec6b06', 'bb53acdd-4535-4c63-bcbc-affdf4a87c43', '6880c3c6-dc10-4fa4-89a1-15bb36475bc2', '58b84e9a-c6b1-432f-9154-39c16c5c6c4e', '6d020c64-9f1a-4787-981b-809db23d7fe4']","['tune-mjcf__e3V7AN7', 'tune-mjcf__tuQ8c4N', 'tune-mjcf__ezGe6sb', 'tune-mjcf__bEsrSZf', 'tune-mjcf__5uzmco3']",0,"[900.150001, 905.38447, 926.405488, 903.975567, 
912.085006]","[11.601399, 14.983068, 20.518119, 24.793314, 16.428378]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,video-processing,5,"['dce71606-3c3d-44ec-82c9-2ff2b6b90017', '30e53f46-c864-4daa-9f4f-f53179e3b3a8', '778d0912-eb5d-4fbd-9e64-1536cd1b248d', '471a30d0-ad55-4fee-bae0-ffd41c9c740e', 'aa4c500f-9ac3-4d13-b2cd-d6b2a24a91ee']","['video-processing__eHoxUNq', 'video-processing__uyrZjKF', 'video-processing__SkhkTNC', 'video-processing__k7VMEAw', 'video-processing__gsQxecr']",0,"[734.966628, 347.069534, 191.416571, 146.085358, 214.152491]","[71.428915, 66.952552, 17.696547, 158.528616, 18.251384]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,vulnerable-secret,5,"['5758f3f6-7ba3-43a3-927a-2acee10ea356', 'cb14cfbb-c94d-4084-b37e-911fe14b8535', '95cced3d-837a-4195-aca9-a18ea1133954', 'bd5ec0ab-6205-4d82-8744-c6f95775a718', 'b59ecf56-52bd-4a33-ad47-8fa0193f959e']","['vulnerable-secret__ovgxzsP', 'vulnerable-secret__q7xvGJv', 'vulnerable-secret__QdCccjZ', 'vulnerable-secret__VJNGUWR', 'vulnerable-secret__vAUEYAu']",2,"[909.040839, 883.723027, 900.17298, 506.285393, 906.910553]","[47.138019, 24.524782, 10.234568, 59.841587, 16.46195]",0.4,False,"['cb14cfbb-c94d-4084-b37e-911fe14b8535', 'bd5ec0ab-6205-4d82-8744-c6f95775a718']" +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,wasm-pipeline,5,"['5521ae71-8218-46ff-be18-bf4bf78cf3ae', 'c1240fdb-3584-4259-b968-0f7319f290ef', '62c9f64c-22ce-423a-925c-9427a28367a3', '063e0a84-f376-4612-aa21-b3b3635d7220', '2ae55719-bbc1-4e65-9991-32578fd559c0']","['wasm-pipeline__tgN57Pt', 'wasm-pipeline__Ei5pmD7', 'wasm-pipeline__jsRicTa', 'wasm-pipeline__M2CrrBY', 'wasm-pipeline__MYegqMz']",3,"[668.711147, 902.518384, 912.009142, 819.460915, 861.04068]","[20.876757, 39.225768, 5.690126, 7.893707, 21.987688]",0.6,True,"['5521ae71-8218-46ff-be18-bf4bf78cf3ae', '063e0a84-f376-4612-aa21-b3b3635d7220', '2ae55719-bbc1-4e65-9991-32578fd559c0']" 
+Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,winning-avg-corewars,5,"['3b796342-349c-4df3-9f6a-945109d63b02', '5c64a0ce-0d37-43dd-b734-44f1e0bbd3f2', 'ddd65d26-9828-4fb6-8842-5544683a07b4', '24edb57e-b515-4450-817f-dbb41af0cf48', '83ff0bfd-63ae-4cd1-959f-13edd7c0d9e2']","['winning-avg-corewars__rwg6DJ3', 'winning-avg-corewars__XdMAssP', 'winning-avg-corewars__jPye5yy', 'winning-avg-corewars__8NvuGHh', 'winning-avg-corewars__u8X49pk']",0,"[3617.791612, 1018.186355, 2644.987331, 2908.69855, 2500.151304]","[80.313467, 7.097878, 14.079213, 28.659943, 64.508308]",0.0,False,[] +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,write-compressor,5,"['4e597b9a-c5ef-4b59-8223-5e86513af6fb', 'c1a1c713-f23f-4ecb-8c5e-65013e98ff1a', '868b95de-384a-49f1-bd00-8bff2712c038', '5118648f-de26-4aff-8431-44add62f6a71', '4ded7305-b551-4435-83d2-75e77477c6ec']","['write-compressor__xieNdbi', 'write-compressor__KjaJ3nh', 'write-compressor__cxzdaAZ', 'write-compressor__oKR6UJJ', 'write-compressor__mspkEBd']",0,"[946.012866, 904.311186, 1416.734966, 357.40933, 609.812507]","[23.341344, 144.140971, 19.09455, 75.876899, 26.6544]",0.0,False,[] +claude-opus-4-1-20250805,adaptive-rejection-sampler,8,"['1284a529-edbb-4347-bd59-bd5493da2c4a', '7daac61f-ef7f-4e79-899d-002f4b720853', 'ad324328-3962-49e4-9455-cdda48b9045c', 'e11be6ad-07a4-4552-8375-4a138ee7911e', '5cd2324a-63e5-4417-9edc-755ac39359d3', '4fcdd852-4c82-4729-b5cc-7762b7e288dc', '4585c41e-32e5-405b-8c54-19fc2ced7d3d', '3024e72e-2c78-48bc-aa7a-8da2915a1b92']","['adaptive-rejection-sampler__aNXbUZg', 'adaptive-rejection-sampler__mQenUWg', 'adaptive-rejection-sampler__U24Ypcy', 'adaptive-rejection-sampler__QNC78Ao', 'adaptive-rejection-sampler__TUaCEQD', 'adaptive-rejection-sampler__Bg56nSf', 'adaptive-rejection-sampler__QMqUhff', 'adaptive-rejection-sampler__SQ8moUR']",1,"[2121.535579, 900.000748, 1318.187283, 904.121964, 947.652979, 901.03392, 900.001006, 906.380667]","[30.8222, 60.747592, 16.022372, 19.848566, 65.753639, 49.005965, 19.78082, 
48.154178]",0.125,False,['7daac61f-ef7f-4e79-899d-002f4b720853'] +claude-opus-4-1-20250805,bn-fit-modify,8,"['e4aa94c8-ec8b-4fbd-ab1e-66ad614990e1', '1fa20ee9-325e-46c4-b090-22368e10c9b2', '3acd3c36-8da2-4cb2-b6c3-78e51ad977d3', '46a7e4ae-b4d5-4053-bea5-842dec05f212', '898cac89-d695-46db-8ab4-5a67c86a074e', '4de09ee5-4ae9-449a-9d06-264f3f435c83', '28255882-cd6a-4aeb-9850-cd41da942f9f', 'f8518e6e-75f5-451b-bbf4-e9280009b305']","['bn-fit-modify__3668zBi', 'bn-fit-modify__x8Bppfs', 'bn-fit-modify__aRZsDm7', 'bn-fit-modify__pvg7a2A', 'bn-fit-modify__XuBsjw2', 'bn-fit-modify__LAetN6k', 'bn-fit-modify__QZhu97h', 'bn-fit-modify__gsHCxzi']",7,"[492.502431, 556.406186, 709.066568, 3148.396303, 312.339663, 429.705317, 2010.089567, 434.211663]","[208.916357, 20.663706, 69.926148, 13.28266, 18.545732, 10.118221, 14.436303, 66.928621]",0.875,True,"['e4aa94c8-ec8b-4fbd-ab1e-66ad614990e1', '3acd3c36-8da2-4cb2-b6c3-78e51ad977d3', '46a7e4ae-b4d5-4053-bea5-842dec05f212', '898cac89-d695-46db-8ab4-5a67c86a074e', '4de09ee5-4ae9-449a-9d06-264f3f435c83', '28255882-cd6a-4aeb-9850-cd41da942f9f', 'f8518e6e-75f5-451b-bbf4-e9280009b305']" +claude-opus-4-1-20250805,break-filter-js-from-html,9,"['0008e336-0b20-40c1-a7b7-171a24dedb1e', 'f7fa1c4c-d940-4b04-b3c8-5186d91383e3', 'bc3ae8b5-74fc-4454-9b09-a9ca11863b7f', 'f9f5040e-e07c-4047-a7bf-f0d6b5f78e7a', '07abddd0-8a13-4559-a31b-137e7b339203', '4cd8953f-32d0-4fd7-9d10-702963de9804', 'ae860e5c-7fea-4d0c-913e-dea5e3ba38c5', 'b4def6cd-da27-405b-b54f-a69b96fbb0fc', 'c821726f-7ac8-4249-ae40-9a12c199e9b8']","['break-filter-js-from-html__85Ap7Ca', 'break-filter-js-from-html__6FbY7vE', 'break-filter-js-from-html__R3XMLke', 'break-filter-js-from-html__kkku7Zn', 'break-filter-js-from-html__64xZqe3', 'break-filter-js-from-html__67ktJQm', 'break-filter-js-from-html__gTW5r3D', 'break-filter-js-from-html__BnN4bPN', 'break-filter-js-from-html__V37rVQg']",2,"[1200.000446, 1038.054024, 1433.311452, 1200.001203, 1220.980814, 1210.427035, 1204.059704, 1228.124283, 
1200.301857]","[14.670786, 56.892474, 36.205352, 6.620019, 16.103186, 106.929811, 12.890103, 7.217558, 11.799534]",0.2222222222222222,False,"['f7fa1c4c-d940-4b04-b3c8-5186d91383e3', 'ae860e5c-7fea-4d0c-913e-dea5e3ba38c5']" +claude-opus-4-1-20250805,build-cython-ext,7,"['dc758f7d-3f57-4366-863d-254582068199', 'b2072ee7-71b9-4ff6-a7fd-c3c994739765', '66f07cd7-3358-4af9-b076-f2572a615b71', 'ab6108e2-5c89-4b49-a6bb-ab401aa260d6', '0e8eb221-0ed3-4301-b90e-7c14d7552466', 'b5c07074-3df7-4b5d-ad8b-e16c1d69fe88', 'c67f451d-6fbc-413a-b078-19d09aa4fff5']","['build-cython-ext__HZueAk9', 'build-cython-ext__xP99Gtr', 'build-cython-ext__Ajz4Sc2', 'build-cython-ext__ZeNnx59', 'build-cython-ext__u4DA384', 'build-cython-ext__kHMDH8b', 'build-cython-ext__SGc8t5g']",0,"[900.239924, 906.73594, 908.751913, 391.65488, 355.528366, 1106.463119, 819.120516]","[9.905421, 95.251746, 80.76814, 14.216452, 10.423655, 14.086483, 38.131282]",0.0,False,[] +claude-opus-4-1-20250805,build-initramfs-qemu,5,"['4b09af71-aea2-4f2e-af72-ba09df9983d2', '38177e56-a04d-43b5-a30a-3268bac4afdc', 'fdf2e318-f7d6-4ad5-bb3f-3dbb1dc3caab', 'aa6f7e7e-5074-43b9-89ec-24775f66a5be', '9e72a9be-9370-43c2-8806-ec0d8b681445']","['build-initramfs-qemu__M6Kv8s8', 'build-initramfs-qemu__LyAPXoa', 'build-initramfs-qemu__GtFR5zc', 'build-initramfs-qemu__f59ahg2', 'build-initramfs-qemu__Yd3HaRr']",0,"[266.960812, 833.239931, 915.374893, 1765.657198, 941.034192]","[10.113314, 18.74592, 26.66418, 11.025914, 43.196876]",0.0,False,[] +claude-opus-4-1-20250805,build-pmars,8,"['f81f030a-7184-492c-aab0-5745976961b6', '34f30856-3acf-421e-8f76-960f02eb687e', 'a2634787-a53f-4c61-a5cf-f66a9c524ee7', 'f80a04e9-2b60-4aff-8a2c-4a6ea03bf2c5', 'bd2b3632-1ec9-4cef-87c6-b88e2d37e711', '404d5ee1-69e0-4edb-aa19-be0318d96bc8', '16278f11-4364-400b-a421-3e0ccb0320e1', '1201fa4c-80d4-4052-92f3-00e3055cc4a1']","['build-pmars__zQJTLbR', 'build-pmars__97G9bXy', 'build-pmars__3ietDrq', 'build-pmars__ZpQBDW2', 'build-pmars__poa6rsA', 'build-pmars__x847F5v', 
'build-pmars__8HBKAaJ', 'build-pmars__UE3R8qn']",4,"[1774.903555, 435.413576, 216.313743, 160.044596, 600.126326, 240.389111, 284.202395, 426.776973]","[1.921645, 15.035574, 5.845382, 2.414952, 41.367095, 1.908836, 5.609373, 71.957622]",0.5,False,"['34f30856-3acf-421e-8f76-960f02eb687e', 'a2634787-a53f-4c61-a5cf-f66a9c524ee7', 'f80a04e9-2b60-4aff-8a2c-4a6ea03bf2c5', '404d5ee1-69e0-4edb-aa19-be0318d96bc8']" +claude-opus-4-1-20250805,build-pov-ray,8,"['a628caf2-3b24-4267-b396-6224b0ea28fb', 'f4e058fb-b6e6-4e75-8350-6c6322d9bc0c', 'e6dab586-0ee2-4913-96ca-b84e461dd698', 'f74ef816-d76c-414c-aea2-2164d75f612b', 'b5f2ac72-f0bf-4b5a-88e2-9466b5bf0c68', '142f0af5-5153-4871-bef3-eef70b2bba15', 'b6438a72-dbf2-409a-8095-03cd4feb0650', '07f4f9ae-1f07-461f-90bb-708c8eae9d4f']","['build-pov-ray__ktj84UJ', 'build-pov-ray__AFKLrmJ', 'build-pov-ray__5SjoSWu', 'build-pov-ray__hUwi2H4', 'build-pov-ray__UP8iWaf', 'build-pov-ray__cmAybvu', 'build-pov-ray__bXfsai9', 'build-pov-ray__R6YUTY6']",6,"[600.042798, 1037.054903, 2203.271707, 872.578565, 637.10085, 912.703749, 3200.760685, 964.374654]","[20.772125, 55.863131, 14.650231, 22.888486, 12.651929, 30.452545, 15.879534, 14.345967]",0.75,True,"['a628caf2-3b24-4267-b396-6224b0ea28fb', 'f4e058fb-b6e6-4e75-8350-6c6322d9bc0c', 'f74ef816-d76c-414c-aea2-2164d75f612b', '142f0af5-5153-4871-bef3-eef70b2bba15', 'b6438a72-dbf2-409a-8095-03cd4feb0650', '07f4f9ae-1f07-461f-90bb-708c8eae9d4f']" +claude-opus-4-1-20250805,cancel-async-tasks,8,"['81c631c5-77cd-4231-80df-01857bd8a03d', 'dae63725-cd6a-488a-a0b7-0442580f9738', '10d323a3-9f96-4154-84df-6e09898863ea', 'de65f11d-d2b3-4458-b327-303bc6cc7d61', '9019bce4-5144-444b-a5c5-17943cf89756', 'a58d9461-6cc5-4423-886a-a4bd539608a0', '9c21b970-70c9-4ed9-9225-3359366bc77c', 'ad2e2a58-29a6-4ebe-8cde-b779f4157310']","['cancel-async-tasks__RqwadXv', 'cancel-async-tasks__XcbXZFZ', 'cancel-async-tasks__n6YNYQ3', 'cancel-async-tasks__uuyWVZc', 'cancel-async-tasks__9Y8xySa', 'cancel-async-tasks__fN2Dxah', 
'cancel-async-tasks__k9Rhrgy', 'cancel-async-tasks__mTh3HWE']",1,"[323.441293, 76.752674, 270.692221, 798.728735, 407.661187, 103.413376, 70.458081, 215.321108]","[116.464477, 17.675938, 51.046011, 181.37061, 117.77172, 9.818332, 16.305025, 45.066109]",0.125,False,['de65f11d-d2b3-4458-b327-303bc6cc7d61'] +claude-opus-4-1-20250805,chess-best-move,8,"['e027b7b1-63bc-40f8-bf55-51fafff0b103', '502642eb-5cb7-4ed0-8925-7b6914690fb8', '8227ce3b-f492-42f1-9e3e-9de905181565', '4b7c492e-dc66-4108-b1cc-1b6556c81c6b', '48d930a6-c9db-436f-9676-5908dd4cb973', '40d35fb2-9ae6-4beb-b77e-ba2bc8c2fa33', '28b74edb-9e8f-4070-9d4b-705ed1b21176', '72e42d17-1f28-41be-a728-8c1dfb07c1a1']","['chess-best-move__woXxTbX', 'chess-best-move__AopnNGw', 'chess-best-move__SvPSfjh', 'chess-best-move__iQgZi38', 'chess-best-move__mozNRDv', 'chess-best-move__JVRAAny', 'chess-best-move__5vmaUuy', 'chess-best-move__NBT5Zqv']",0,"[216.625252, 336.264846, 672.948844, 210.156209, 389.608364, 231.781019, 271.049721, 578.983481]","[10.021319, 14.065744, 16.677027, 7.133927, 16.131998, 20.034351, 22.940062, 321.257429]",0.0,False,[] +claude-opus-4-1-20250805,circuit-fibsqrt,8,"['b49e398c-2fc2-473e-8937-2b3876543994', '17a91017-f88a-4642-abd9-af2d7d03aa99', '9e7a0b84-264c-42ff-b403-90d9702e7d62', '05da3efd-d0f3-4a02-b588-b84c9904fc0e', 'c537c24f-7017-4b27-b700-0640307d24e4', 'c3be3873-dfd1-44ad-a02f-df4888b8fd32', 'e359f792-5f92-4b75-b18d-ca66c5589226', '9d23b336-3fc2-4536-a311-817fd8e460ba']","['circuit-fibsqrt__G7jdjxF', 'circuit-fibsqrt__NmGu9JF', 'circuit-fibsqrt__CYogEna', 'circuit-fibsqrt__ncSh73X', 'circuit-fibsqrt__4CVduAF', 'circuit-fibsqrt__DNhjbbV', 'circuit-fibsqrt__ZCmSkdH', 'circuit-fibsqrt__btYsAYW']",0,"[3605.205582, 518.937269, 3612.399691, 724.351243, 3606.374705, 1077.280833, 3600.00101, 3546.749669]","[28.33026, 8.624163, 19.141838, 8.01077, 78.073332, 15.591136, 7.711508, 53.70866]",0.0,False,[] +claude-opus-4-1-20250805,cobol-modernization,8,"['311b3138-75b1-4a83-8d4d-cf258de0d3f0', 
'd48352a3-f11c-4fac-aee8-9443adb8a733', '200db22f-b194-4bd7-9485-a799febbf2db', '6ea4f896-8f6e-4e95-9751-e1bad37e10b2', 'f704e922-ad3d-4cba-a54a-c1cbda8203dc', '2f822d19-327a-4092-a057-2cb2d707c402', '2d94f936-7b6a-4114-9f4e-efdba474f2c7', '49b56163-d8f8-4e2e-9936-a62bc3f89546']","['cobol-modernization__8vAyvUW', 'cobol-modernization__voNGk79', 'cobol-modernization__hFGp8G7', 'cobol-modernization__zyRnYcp', 'cobol-modernization__ZZTEnnp', 'cobol-modernization__mVkyLiR', 'cobol-modernization__y8cFfGF', 'cobol-modernization__LY4p2h5']",7,"[240.765361, 315.53184, 919.19774, 478.885807, 435.361757, 133.045817, 904.295166, 957.879926]","[20.071883, 21.261415, 97.190245, 21.985842, 34.688208, 9.051838, 49.208325, 10.398741]",0.875,True,"['311b3138-75b1-4a83-8d4d-cf258de0d3f0', 'd48352a3-f11c-4fac-aee8-9443adb8a733', '200db22f-b194-4bd7-9485-a799febbf2db', '6ea4f896-8f6e-4e95-9751-e1bad37e10b2', 'f704e922-ad3d-4cba-a54a-c1cbda8203dc', '2f822d19-327a-4092-a057-2cb2d707c402', '2d94f936-7b6a-4114-9f4e-efdba474f2c7']" +claude-opus-4-1-20250805,code-from-image,8,"['3171e92f-94fd-48e4-aafa-a31948aac168', 'af3ae81f-df7c-4270-9ecf-a0aa24a03b75', '3158c005-9fc2-4761-bf22-aaa84e59462b', 'da87cd0e-5791-4a97-a839-15b884240b3f', 'bfab6d2d-8b17-4530-b95d-706c2cffb57f', '444230cf-b35b-4c74-ba14-dd6ebbd853c9', 'fde3398d-cc4c-414e-9a9d-6305304b8886', '1f1d6ef1-be2e-4ef5-907f-c13ab80724c4']","['code-from-image__fpTLRzf', 'code-from-image__FYUQor6', 'code-from-image__CV5VFpy', 'code-from-image__3naE2uh', 'code-from-image__jajJMW5', 'code-from-image__oSBy7YW', 'code-from-image__pnweBGN', 'code-from-image__fpiDNpY']",1,"[747.059007, 1210.201027, 1204.245047, 238.054528, 1220.200444, 1202.099865, 1200.002843, 1971.751474]","[38.745609, 12.386194, 9.739847, 9.284186, 148.435505, 51.664637, 21.221227, 24.339548]",0.125,False,['3171e92f-94fd-48e4-aafa-a31948aac168'] +claude-opus-4-1-20250805,configure-git-webserver,8,"['c3775e21-dc38-4cbf-8093-c659a6ffca66', 
'f159c79d-2470-48aa-8a61-edcd0f7b70c4', '0448e7e9-533e-4e5c-833a-5e2f0f0812c6', '0f838bbd-e6f7-4ae4-9f82-3ff6f4fbd817', '7151285d-ca87-4f88-a1da-731b3a7e85fb', '4e8f60c0-b75a-4f48-9b67-1db360c1a653', 'eccd6e7a-5624-422c-bd9e-a779204856e7', '83274880-deb9-49e4-b1b1-bae3269b994c']","['configure-git-webserver__A8NmEaP', 'configure-git-webserver__U9E73Dz', 'configure-git-webserver__iveiPjG', 'configure-git-webserver__okmgbPc', 'configure-git-webserver__9jPNCkD', 'configure-git-webserver__84swWiY', 'configure-git-webserver__FxcV42o', 'configure-git-webserver__D3Sfavh']",5,"[125.583902, 83.241783, 99.638185, 511.925172, 416.718266, 549.973132, 506.423469, 523.431272]","[13.39298, 14.884282, 20.195418, 81.557999, 162.642391, 64.533977, 36.182426, 17.876043]",0.625,True,"['0448e7e9-533e-4e5c-833a-5e2f0f0812c6', '0f838bbd-e6f7-4ae4-9f82-3ff6f4fbd817', '7151285d-ca87-4f88-a1da-731b3a7e85fb', '4e8f60c0-b75a-4f48-9b67-1db360c1a653', 'eccd6e7a-5624-422c-bd9e-a779204856e7']" +claude-opus-4-1-20250805,constraints-scheduling,9,"['0e9c10ae-cd82-4afc-b329-c70d9552ec0d', 'd768fac9-7968-492f-8224-5ede70c87908', '21dc4950-581a-43c9-b9c0-3ef43be39b36', '0afcfa0b-7968-4c38-b0ec-90c0a0c96859', '4cf44c0c-500b-4e52-ab57-70ed854d001e', '77daed4f-a7a5-4e5b-8ff7-6cc5a9746454', 'bd872ef7-223c-41c5-b1db-1ffc0197c52b', '128bf28d-0794-4e84-8142-32f5736c5329', '4fef5661-ba2f-4530-8cb4-97c9cdcac8b5']","['constraints-scheduling__XmDSm7C', 'constraints-scheduling__GFFgPoj', 'constraints-scheduling__GCuuPWw', 'constraints-scheduling__4xj3KBp', 'constraints-scheduling__LLVyDSa', 'constraints-scheduling__z6Zwief', 'constraints-scheduling__oivUhZL', 'constraints-scheduling__34mubXZ', 'constraints-scheduling__hiPrEnd']",8,"[335.54073, 199.218903, 365.262643, 86.497593, 379.176898, 109.424085, 533.379048, 154.718894, 125.657312]","[46.25222, 24.204957, 122.242623, 11.774248, 71.18909, 33.632721, 209.221583, 25.589739, 11.048622]",0.8888888888888888,True,"['0e9c10ae-cd82-4afc-b329-c70d9552ec0d', 
'd768fac9-7968-492f-8224-5ede70c87908', '21dc4950-581a-43c9-b9c0-3ef43be39b36', '0afcfa0b-7968-4c38-b0ec-90c0a0c96859', '4cf44c0c-500b-4e52-ab57-70ed854d001e', '77daed4f-a7a5-4e5b-8ff7-6cc5a9746454', '128bf28d-0794-4e84-8142-32f5736c5329', '4fef5661-ba2f-4530-8cb4-97c9cdcac8b5']" +claude-opus-4-1-20250805,count-dataset-tokens,8,"['428e829a-0c30-48ec-ad8d-a31fd4be7d49', '2a6609c0-65b1-47f6-abb1-b00fef77a766', '1f312ef1-eb47-4a2c-bd3e-73e67b672605', '60f187bc-4a5c-4215-863f-8d6be168cf4f', '1f0839c9-5660-4b3b-8d7f-c9a033e50aec', 'bf5b9ab7-080c-4c78-93ec-76e703a888e1', '0623dc91-fa40-4bca-977d-22980b15e100', '2e2165f4-2983-4238-b452-a2f86d005921']","['count-dataset-tokens__XCq3ufz', 'count-dataset-tokens__CcFiADs', 'count-dataset-tokens__tDxpPw7', 'count-dataset-tokens__HyyHbmM', 'count-dataset-tokens__7KaJgpC', 'count-dataset-tokens__CZwZMQo', 'count-dataset-tokens__Sw3xj8Z', 'count-dataset-tokens__dy9AGQf']",0,"[170.811476, 176.177157, 306.541506, 917.745426, 175.192597, 480.764525, 279.409725, 550.255913]","[30.463449, 10.251717, 14.059175, 90.382923, 10.468349, 65.933046, 26.354453, 24.838594]",0.0,False,[] +claude-opus-4-1-20250805,crack-7z-hash,9,"['f518223a-567a-41ab-9390-086a69abdc56', 'f7eb3c92-6b46-4021-8a20-a109bb54dd22', 'e6da1840-fb0a-4ca6-b4d7-7d60410e7218', 'd69ca7d1-2fd8-4f4e-95d1-6a1c66bf68fe', '432c868e-25b4-4359-95af-dbb34a4b2d7d', '7f16a20d-a5f5-49bf-86f9-b0239a6436ed', 'c1e68c21-c76a-4e73-b2ab-d8aa37fd5c83', '7176447e-59c1-4860-96a9-d5da2c401656', '5ad4e3f0-a931-423e-bfec-3ecc95d8d189']","['crack-7z-hash__GRXeyiH', 'crack-7z-hash__CWVA2nB', 'crack-7z-hash__znyqLvR', 'crack-7z-hash__XyPZ9vZ', 'crack-7z-hash__zrf3SKZ', 'crack-7z-hash__8UBpKJG', 'crack-7z-hash__7itEjE7', 'crack-7z-hash__zfyob22', 'crack-7z-hash__pCbd7N4']",8,"[581.221997, 574.585282, 685.795384, 581.434339, 556.88633, 356.500901, 217.612309, 604.683938, 386.362799]","[14.738917, 21.618166, 27.633118, 25.830998, 68.511287, 14.766236, 8.210009, 14.531256, 
17.635864]",0.8888888888888888,True,"['f518223a-567a-41ab-9390-086a69abdc56', 'f7eb3c92-6b46-4021-8a20-a109bb54dd22', 'e6da1840-fb0a-4ca6-b4d7-7d60410e7218', 'd69ca7d1-2fd8-4f4e-95d1-6a1c66bf68fe', '432c868e-25b4-4359-95af-dbb34a4b2d7d', '7f16a20d-a5f5-49bf-86f9-b0239a6436ed', '7176447e-59c1-4860-96a9-d5da2c401656', '5ad4e3f0-a931-423e-bfec-3ecc95d8d189']" +claude-opus-4-1-20250805,db-wal-recovery,9,"['735b85e1-43ce-4cab-bd9a-5be2a1441d5c', '54d1e8fc-3838-4bb7-a068-256012fe8d8e', '8b907b58-54b4-4dcc-a0ee-d64b91e12c1e', '185c144f-e5f0-4413-8a71-980d641d7b3a', '0e13e697-d4f5-4793-a157-a6aa3222e48a', 'e5ef1524-6e3b-4942-86a2-39bbb2b0813c', '638a5d66-5dc4-4ba6-828a-123a901983c1', 'effe30ab-2890-475b-ade0-263e7ea87865', '26f30ad3-b0e4-4531-939c-1c03f9d6dcdc']","['db-wal-recovery__qQ9jPbM', 'db-wal-recovery__muWDCpv', 'db-wal-recovery__5uDeLMt', 'db-wal-recovery__M5MtZLx', 'db-wal-recovery__jgvfeVi', 'db-wal-recovery__VsqHLcf', 'db-wal-recovery__67xnjhf', 'db-wal-recovery__PLdLiWL', 'db-wal-recovery__2JgYJRT']",0,"[500.045358, 506.926065, 587.430964, 364.409, 876.161393, 249.388615, 254.539664, 1003.965977, 904.844732]","[24.436683, 59.48416, 27.489177, 10.991076, 25.55269, 15.763446, 10.641735, 24.319528, 12.873081]",0.0,False,[] +claude-opus-4-1-20250805,distribution-search,9,"['c648a06e-140c-4bf5-b25d-3e1774847bc4', '688d7dc2-3636-4358-9a68-4241ee609984', '91e02959-3ec2-4409-be19-40fd8e445ee3', 'b7ecbc3c-5b5c-4eef-b2c2-ec3a3814483a', 'b961da7e-a721-4c05-b52b-75e8b035f040', 'ad53aa1f-22d8-4b8d-a25b-89bec1c9a99e', '2affbd25-6505-4fa8-8919-0d29c8e0ceb7', '826e77bb-4c7c-4e30-b881-40c31a6b208d', '5ca8ef08-5382-4f65-8487-2872c9840b17']","['distribution-search__7kMEgBV', 'distribution-search__CLVLT9B', 'distribution-search__akhinvg', 'distribution-search__fcQopFU', 'distribution-search__8MjHR7H', 'distribution-search__hkf2RbD', 'distribution-search__RY4Qq3a', 'distribution-search__84FYwf7', 'distribution-search__mmj5ysW']",5,"[1513.986603, 3601.873857, 2382.451914, 
896.313803, 987.774852, 3600.002506, 256.920603, 3674.152675, 335.200085]","[9.101118, 16.958356, 8.643579, 49.415187, 226.926724, 9.907281, 15.203385, 207.345396, 21.650897]",0.5555555555555556,True,"['c648a06e-140c-4bf5-b25d-3e1774847bc4', '91e02959-3ec2-4409-be19-40fd8e445ee3', 'b7ecbc3c-5b5c-4eef-b2c2-ec3a3814483a', 'b961da7e-a721-4c05-b52b-75e8b035f040', '2affbd25-6505-4fa8-8919-0d29c8e0ceb7']" +claude-opus-4-1-20250805,dna-assembly,8,"['5854f038-62dd-4075-ab0a-13f36ff088f4', '9c1ede3e-f4ae-426d-a6a0-be7be1d2816d', '8d3d070d-8515-4ad5-b7f0-936792fc7074', '270fff03-dd54-4da2-8a11-0404be30a5ab', '0dfb13e5-503a-4d44-a304-9c8914aa3460', '10a98bb8-8450-48b0-a062-1703ff8840c9', 'f096ea2b-5bf4-4561-9ac0-ada3f19112c0', 'da128935-f806-4adf-abb7-ecacc7e7071a']","['dna-assembly__mXYJc8C', 'dna-assembly__wqNwUPy', 'dna-assembly__jfXeg6C', 'dna-assembly__DAgsuby', 'dna-assembly__hmvgXYJ', 'dna-assembly__M2MrvdK', 'dna-assembly__UcMbBmo', 'dna-assembly__cWVCS8y']",0,"[511.076769, 285.310443, 720.510238, 728.300629, 724.926875, 624.445139, 754.891937, 734.660342]","[17.065019, 17.090219, 217.180605, 43.021908, 29.584385, 16.2608, 32.902254, 95.819925]",0.0,False,[] +claude-opus-4-1-20250805,dna-insert,8,"['83d46178-f3cb-416a-989b-674ac1c8c59b', 'ab0f99bb-4d7f-4c79-b44d-07f86e76514a', '7cc81acf-c15b-4148-bd0e-e82fc04c9447', 'a2d67299-86f3-451a-9c1d-48d3e8068626', 'e3d8f8d3-1789-4e6b-874c-61483ca81b7b', 'ec1bb383-d44f-4b55-a845-c1ccf8b411fc', 'eef21312-014e-480f-9a90-aee2d4bb6178', 'c9365468-fe97-4ae1-9c36-4a88b69a5628']","['dna-insert__XdFpUMr', 'dna-insert__bY7DLGr', 'dna-insert__Bho5mFJ', 'dna-insert__PBvQdLj', 'dna-insert__6CjCicC', 'dna-insert__3TNa6iT', 'dna-insert__ATR5igC', 'dna-insert__gx5neSs']",0,"[366.177928, 219.451668, 145.54479, 360.012105, 360.001079, 360.000856, 360.748988, 375.049858]","[54.465628, 16.468533, 19.584376, 73.564314, 26.151386, 29.76714, 20.165464, 13.944993]",0.0,False,[] 
+claude-opus-4-1-20250805,extract-elf,9,"['6756bf43-ec57-4ec9-806e-5c4663836e90', '802d403e-5284-4a8f-9d89-bbb6008a6805', '8ce8262e-647f-4f46-9120-2f75ca722077', 'd73d427c-a78a-47a5-8994-5c1b06869a3e', '8f78de3c-61dd-43a5-a8fa-d6cbc706b597', 'a1e18589-587a-436e-bb26-1c2b2f166a92', 'd85a7cf9-ca2e-4ac6-902d-46171722c69d', 'a8be5d3c-96d8-4a69-a1a5-830ba102fa74', 'fac83c01-9bc6-4848-9eb8-d837ac6bb292']","['extract-elf__keQciKG', 'extract-elf__cCqXgbn', 'extract-elf__HsjfnJt', 'extract-elf__SK5tEHu', 'extract-elf__uAcNS4n', 'extract-elf__yeJwru5', 'extract-elf__yMFaQ6N', 'extract-elf__otFQggf', 'extract-elf__7EuqH8h']",8,"[232.32937, 128.555051, 132.109921, 323.859053, 251.076883, 495.15662, 226.238576, 158.103233, 372.45689]","[26.648638, 9.359082, 9.420419, 13.777933, 18.169198, 67.847461, 22.338121, 23.01251, 35.833494]",0.8888888888888888,True,"['6756bf43-ec57-4ec9-806e-5c4663836e90', '802d403e-5284-4a8f-9d89-bbb6008a6805', '8ce8262e-647f-4f46-9120-2f75ca722077', 'd73d427c-a78a-47a5-8994-5c1b06869a3e', '8f78de3c-61dd-43a5-a8fa-d6cbc706b597', 'd85a7cf9-ca2e-4ac6-902d-46171722c69d', 'a8be5d3c-96d8-4a69-a1a5-830ba102fa74', 'fac83c01-9bc6-4848-9eb8-d837ac6bb292']" +claude-opus-4-1-20250805,feal-differential-cryptanalysis,8,"['16042bc7-3c75-495d-b562-021f08b2a053', '101f0de8-a65c-40d2-bfef-5c194785c5bb', '1657b0c7-a2a6-4dab-bad7-9fcb89e0b152', 'c6ed2b83-0586-4bda-8ec7-9132960f515d', 'ce530fcb-77da-4c3f-b7ed-4696d0fe9d11', '9ca2a341-893f-412c-a423-c4d6cd8c16bb', '09b42e7f-972f-4e3c-b529-d8ec69fbf33a', 'cb6f4975-6a02-4803-b454-ea657ccb1af1']","['feal-differential-cryptanalysis__NBkEePV', 'feal-differential-cryptanalysis__a5KdBC5', 'feal-differential-cryptanalysis__saR73da', 'feal-differential-cryptanalysis__rj7Bpx9', 'feal-differential-cryptanalysis__6XxnkiA', 'feal-differential-cryptanalysis__diQcUmd', 'feal-differential-cryptanalysis__hjAy9sh', 'feal-differential-cryptanalysis__iDebQDp']",0,"[1807.272191, 1800.001205, 1800.332737, 1869.677587, 1800.001361, 1800.001022, 
1801.241135, 1813.928094]","[41.850502, 10.062464, 107.954756, 269.101767, 9.348346, 15.586222, 9.467321, 10.63294]",0.0,False,[] +claude-opus-4-1-20250805,feal-linear-cryptanalysis,9,"['16cc88fa-70e7-4db8-9c81-2ed8f543f4d1', 'c76eb7ec-e7bc-48ed-bec1-6905f5fea61d', 'edc946cf-9f32-47dc-82bf-06aeac0a763d', '9081549d-9bef-4a44-b0fe-f5e760f1e4cb', '387a5334-b5d8-47ca-a0fa-6cd76ae1a07f', '954b12e0-f84f-49fd-b97e-1fce9cd819ea', 'f21a3760-fafb-4596-a9bf-846b1afa2ce4', 'c3faf798-b109-4f60-acf0-434a79257b56', '03e0ce95-b78e-410e-a460-481644c3887a']","['feal-linear-cryptanalysis__q9Zw93T', 'feal-linear-cryptanalysis__e8BSDVd', 'feal-linear-cryptanalysis__pG6EcUT', 'feal-linear-cryptanalysis__7SKNspp', 'feal-linear-cryptanalysis__pGKwZKs', 'feal-linear-cryptanalysis__YwuKsV9', 'feal-linear-cryptanalysis__zej2YJf', 'feal-linear-cryptanalysis__oUcFkeP', 'feal-linear-cryptanalysis__v9qjx7T']",0,"[1800.000444, 1800.005004, 1800.225201, 1800.509458, 1802.532733, 1803.370024, 1814.22546, 1803.415785, 1807.988643]","[9.913686, 9.162457, 30.663401, 26.862661, 23.202262, 69.260679, 27.726454, 28.511357, 381.882402]",0.0,False,[] +claude-opus-4-1-20250805,filter-js-from-html,9,"['4edc8459-8675-459f-a195-a3a956bbc1c2', '8bb9a620-8e27-44eb-8d55-5dd9ad106f92', '5130b763-6a79-4f2f-9081-7479fdcc89eb', 'aadfbb61-677b-40af-a7d3-5147a44aecf7', '0d0ac6a1-3a52-47f9-a160-cef281679c0e', 'd05ac18f-8183-4bf9-8da0-5f15f07c3997', 'dc5ead54-0bd0-4d4c-b205-16942ee6b0b3', '98ea32dd-cd49-49ab-a20f-77aea9e90139', 'e33a5b98-49ca-4c9e-a02c-48a3a278d976']","['filter-js-from-html__K6J626y', 'filter-js-from-html__gx3dWGZ', 'filter-js-from-html__5Cd9ChD', 'filter-js-from-html__4NPTKu9', 'filter-js-from-html__Ey8M6wv', 'filter-js-from-html__Q6zCe2f', 'filter-js-from-html__jEgh7RF', 'filter-js-from-html__AJCbyMx', 'filter-js-from-html__77iJhiA']",0,"[687.531898, 214.033549, 497.97139, 244.716243, 297.129012, 340.037855, 853.078775, 199.584844, 909.1637]","[84.376482, 7.202769, 171.683365, 6.847697, 9.008618, 
19.438356, 43.69296, 6.650014, 73.25183]",0.0,False,[] +claude-opus-4-1-20250805,financial-document-processor,8,"['5c3560d2-ca9d-453a-9a17-aa4b022d72b1', 'a6547ec3-3f6d-4bcc-b07c-9355a18c0c33', '6f84fb8d-5818-4974-968d-064bbd6990d0', '171affe1-ba43-49da-86b0-969956d3ab68', '647be2a0-189c-4619-bb02-51c65e5199bd', '1c1e07c9-754b-4a7f-8f06-9ee94e507748', '9d6947ee-7536-4e7f-b42f-15862c392708', '27ddeb92-460d-49e7-bf3d-4766e7c41341']","['financial-document-processor__UK2jGer', 'financial-document-processor__vGjatwp', 'financial-document-processor__Lb9G4n7', 'financial-document-processor__9955mfV', 'financial-document-processor__uKEsVCG', 'financial-document-processor__wmhxfKU', 'financial-document-processor__X64MRo3', 'financial-document-processor__qb5abjU']",0,"[433.509708, 409.223505, 748.892467, 499.256021, 318.867634, 193.840313, 471.766738, 517.630565]","[301.243769, 44.346574, 15.689611, 111.903752, 253.870982, 19.842579, 31.91913, 16.568276]",0.0,False,[] +claude-opus-4-1-20250805,fix-code-vulnerability,8,"['0755df59-ef1d-41bb-a1fb-d251cf47523e', 'adb67505-f120-4d11-a68f-68a9689ee93f', '2e826f40-86e4-4c76-a38a-72e7b3d3155a', '0e261ee6-9a2b-403e-9689-ee95fca29725', '5b39977e-c4a3-4cdb-9e7c-878dcab0d1a5', '4b1fd819-805b-43c9-9afe-8ac46704b634', 'a8c719a9-8eeb-411a-b548-42c304ac9193', '0739d1f9-915a-4389-9bbc-fc4d35fab3ae']","['fix-code-vulnerability__Aj9hULg', 'fix-code-vulnerability__MbCCTmm', 'fix-code-vulnerability__PWj9DRQ', 'fix-code-vulnerability__EzUkCJB', 'fix-code-vulnerability__aHUVP4E', 'fix-code-vulnerability__YAejLZa', 'fix-code-vulnerability__tT3NMGz', 'fix-code-vulnerability__ZPaV8kV']",1,"[295.388928, 900.460466, 273.411887, 645.203066, 952.519263, 980.795787, 900.000752, 563.285081]","[3.224027, 76.048322, 1.671939, 1.998695, 11.598941, 60.158905, 4.466733, 46.033419]",0.125,False,['2e826f40-86e4-4c76-a38a-72e7b3d3155a'] +claude-opus-4-1-20250805,fix-git,9,"['d70d915e-a962-4b22-a008-67afe232d46d', '3b02795e-22c0-432b-90d8-703d409b8807', 
'08fe0f55-973a-4ff6-8852-e2fa4abd7068', '36ea7088-bfc1-47d5-bb8c-3ee8b1a24501', '4e730c48-1027-46e4-8b31-b2663734536d', '8f18950b-6520-4516-9d58-e1a6f82cdc34', '6445caef-5deb-4dee-89b3-d502ddbe7e71', '449e75d6-874d-4db1-986f-1ef70401564b', '11022477-f3c9-42ca-9d3e-1a0c7f2e4938']","['fix-git__tmJzMkK', 'fix-git__Eg5fvF6', 'fix-git__cbsRsro', 'fix-git__f5whSpZ', 'fix-git__6gAxHjW', 'fix-git__BR5g4wG', 'fix-git__EMqMpSb', 'fix-git__nAqcywS', 'fix-git__9E9wXjS']",9,"[235.71115, 215.462981, 82.930545, 69.302587, 52.513478, 140.710414, 173.755913, 94.675205, 250.800174]","[66.44288, 32.508883, 62.105616, 7.757144, 9.279287, 29.894652, 47.626513, 13.37588, 103.853177]",1.0,True,"['d70d915e-a962-4b22-a008-67afe232d46d', '3b02795e-22c0-432b-90d8-703d409b8807', '08fe0f55-973a-4ff6-8852-e2fa4abd7068', '36ea7088-bfc1-47d5-bb8c-3ee8b1a24501', '4e730c48-1027-46e4-8b31-b2663734536d', '8f18950b-6520-4516-9d58-e1a6f82cdc34', '6445caef-5deb-4dee-89b3-d502ddbe7e71', '449e75d6-874d-4db1-986f-1ef70401564b', '11022477-f3c9-42ca-9d3e-1a0c7f2e4938']" +claude-opus-4-1-20250805,fix-ocaml-gc,8,"['6ab64a24-d963-4053-8f17-ffc44ae48c97', '1d4e99e1-3062-4b25-839a-18b3e1d9179c', 'c7b00e2a-235a-4a13-8741-815937b1d10d', '42d71610-09fb-4716-ad4b-d376e95eca25', '3fcff4d2-19a0-40ed-8ffd-2e7a86783840', '41f13e8c-1b7a-4684-96a4-fbd14fdadeac', '7111a952-bb48-4637-bcc5-90e2b2a6e645', '905cb864-7a06-47d4-a7cc-bfa647e1d097']","['fix-ocaml-gc__7fvprQr', 'fix-ocaml-gc__JS7p93s', 'fix-ocaml-gc__zmNP8Sd', 'fix-ocaml-gc__4xRzQJ4', 'fix-ocaml-gc__FdWm6ZH', 'fix-ocaml-gc__ardpjcD', 'fix-ocaml-gc__aRzAN2V', 'fix-ocaml-gc__nTEUPGq']",4,"[2913.531335, 2020.377457, 1770.354747, 3605.734469, 3681.242939, 3600.001989, 2914.706675, 3604.894393]","[13.531729, 251.332851, 38.421508, 59.608992, 61.519353, 19.485185, 20.673138, 14.663975]",0.5,False,"['6ab64a24-d963-4053-8f17-ffc44ae48c97', '1d4e99e1-3062-4b25-839a-18b3e1d9179c', 'c7b00e2a-235a-4a13-8741-815937b1d10d', '7111a952-bb48-4637-bcc5-90e2b2a6e645']" 
+claude-opus-4-1-20250805,form-filling,8,"['81d164d0-a2d4-4114-92d9-c46365ba523c', 'c191e077-3d47-465c-84df-b42e5c0cfc1b', '3302e888-31c8-4c5e-ac13-658696faaac2', '614fbc14-f301-4bef-bd3b-ab65e6b16d17', '0c465521-c4c7-4803-ab13-d77a9d9f8e23', '849de4bd-8ee5-4870-a8f0-5e15aa773c50', 'deea11ee-e07b-48aa-9b4d-332fc6a95b5d', '0661b9b4-0109-4776-b308-0e28b6c83ada']","['form-filling__9yn9ozp', 'form-filling__y5DQc3b', 'form-filling__MkRNX3Q', 'form-filling__Goxunkd', 'form-filling__j9F8B3w', 'form-filling__5fSZkDS', 'form-filling__f5VRMoH', 'form-filling__4o2Z4Ly']",8,"[152.590298, 258.675238, 644.983843, 253.895368, 700.345711, 209.095213, 647.561332, 228.118926]","[1.710635, 10.611345, 15.192752, 5.246657, 1.632401, 9.849313, 19.09403, 3.921144]",1.0,True,"['81d164d0-a2d4-4114-92d9-c46365ba523c', 'c191e077-3d47-465c-84df-b42e5c0cfc1b', '3302e888-31c8-4c5e-ac13-658696faaac2', '614fbc14-f301-4bef-bd3b-ab65e6b16d17', '0c465521-c4c7-4803-ab13-d77a9d9f8e23', '849de4bd-8ee5-4870-a8f0-5e15aa773c50', 'deea11ee-e07b-48aa-9b4d-332fc6a95b5d', '0661b9b4-0109-4776-b308-0e28b6c83ada']" +claude-opus-4-1-20250805,git-leak-recovery,9,"['79c5c17d-a4e3-4af1-84f5-e1c8f19d6005', '740ccc3f-2bab-4d1b-a3c5-08734da0daca', '0daff0df-347c-43d7-aec9-94141316e1cf', '8c29090d-c415-4479-b812-8694e1524f1f', 'e5db8d0b-3435-4784-bcab-a68bac2c70f7', 'd0d9f21c-f0e4-46a9-9f67-789abecb4913', '2bc302ce-858c-469e-b020-a19d8072bc85', '3efe6916-87ec-4504-a41f-579d3ef31013', '9191c061-94bc-4190-a7ff-d9bac3e10a5c']","['git-leak-recovery__GmKKwoc', 'git-leak-recovery__BRqZeBA', 'git-leak-recovery__kXZnbuM', 'git-leak-recovery__tYsZbTD', 'git-leak-recovery__6GYKjKk', 'git-leak-recovery__x7SJx2F', 'git-leak-recovery__YkxpQga', 'git-leak-recovery__FFTdM8P', 'git-leak-recovery__4uh5jFN']",9,"[135.387313, 85.344766, 245.159802, 228.257215, 147.709571, 119.716484, 230.848446, 80.871534, 316.178437]","[83.838545, 14.345175, 22.595414, 33.682185, 23.103529, 16.515379, 42.550382, 30.155117, 
56.705631]",1.0,True,"['79c5c17d-a4e3-4af1-84f5-e1c8f19d6005', '740ccc3f-2bab-4d1b-a3c5-08734da0daca', '0daff0df-347c-43d7-aec9-94141316e1cf', '8c29090d-c415-4479-b812-8694e1524f1f', 'e5db8d0b-3435-4784-bcab-a68bac2c70f7', 'd0d9f21c-f0e4-46a9-9f67-789abecb4913', '2bc302ce-858c-469e-b020-a19d8072bc85', '3efe6916-87ec-4504-a41f-579d3ef31013', '9191c061-94bc-4190-a7ff-d9bac3e10a5c']" +claude-opus-4-1-20250805,gpt2-codegolf,8,"['8a1640df-dad4-4f97-9c51-a6f305b4f582', 'd2f9865a-fc4c-4150-b3f2-1e1050e37e80', 'b3550fce-5075-475f-8e97-3c1f16b8db77', '4133e8c0-bf92-4b53-9436-3ddec9417aad', '7aa9233a-eb99-4bc1-b8fd-f0ceeef3c326', '07146589-b046-4b5c-bdc1-6aa2f0b412d5', 'c9e92c24-2d05-4b52-9314-5ab7406e0b9d', 'c28cdaed-8325-4300-a093-0ee1246bdeec']","['gpt2-codegolf__ogJKjSY', 'gpt2-codegolf__DT4zsFK', 'gpt2-codegolf__6zUppwT', 'gpt2-codegolf__DThnsCG', 'gpt2-codegolf__vCSEyqm', 'gpt2-codegolf__DTjsBob', 'gpt2-codegolf__ZAp3pYJ', 'gpt2-codegolf__363QB3b']",0,"[900.099502, 917.690204, 1018.917097, 900.149939, 900.002203, 900.035935, 907.131468, 1116.660261]","[65.918184, 93.06181, 20.449778, 17.679411, 13.81553, 117.209005, 293.22754, 20.48828]",0.0,False,[] +claude-opus-4-1-20250805,hf-model-inference,8,"['b07b256a-1949-489f-8763-b2329326d1fc', '15165a39-69c1-4c0f-bf4c-71bf15f19fea', '4a773c2d-70aa-42cb-a1d4-e39de686e077', 'ab827028-5277-457f-a17e-f2346fe6297d', '36687ea4-d7af-4cba-90d2-aee7f7799c6d', 'dfd2e2db-cb2d-49cb-8c1e-5679d9ac78d2', '461e9c0b-d5bd-4190-9776-b621a9e8c217', '7a6e8762-3089-43db-916a-80eeb0ad1e75']","['hf-model-inference__w5LR89q', 'hf-model-inference__LZ3qi5d', 'hf-model-inference__VvTXKrE', 'hf-model-inference__n8CWE3H', 'hf-model-inference__z4ase3R', 'hf-model-inference__pBB3uyJ', 'hf-model-inference__tF3mB9k', 'hf-model-inference__vZfWAVC']",2,"[616.661995, 955.236685, 578.428453, 412.360843, 151.56206, 442.837949, 467.603847, 171.021963]","[103.750154, 28.55365, 9.344793, 39.65871, 11.465248, 18.578117, 65.756169, 
14.263104]",0.25,False,"['dfd2e2db-cb2d-49cb-8c1e-5679d9ac78d2', '7a6e8762-3089-43db-916a-80eeb0ad1e75']" +claude-opus-4-1-20250805,install-klee-minimal,8,"['2e2adf0f-ee9f-4f3c-b1c3-fff4213ae2dd', '1fa7a8d7-eb31-4308-b71b-2075a92e0f51', '669853d5-65f0-4664-b562-f36c14dbc973', 'c931cdb9-5ce8-4b57-b843-3ac1c8db6239', '5a9d07ee-1578-4478-ab8d-a7f6ed0ed766', '49a0f346-d0fe-4181-9206-7555273b326d', '7f1cc64b-59f1-4690-bd6f-3110aface092', 'f871f347-cd99-4582-a001-5031520a1252']","['install-klee-minimal__jmxwsJQ', 'install-klee-minimal__7v5J7iu', 'install-klee-minimal__TBEchxZ', 'install-klee-minimal__HfyL6CH', 'install-klee-minimal__vvAEnUu', 'install-klee-minimal__FLciAiP', 'install-klee-minimal__SFXF4pt', 'install-klee-minimal__R8abQay']",0,"[901.186887, 923.610495, 900.190278, 913.912962, 900.136276, 900.000637, 900.001134, 900.78486]","[58.579442, 38.218308, 96.3023, 10.525982, 59.321506, 8.922705, 13.36233, 101.572888]",0.0,False,[] +claude-opus-4-1-20250805,install-windows-3.11,6,"['f9d1aa7d-8bbd-440b-b0e0-fe8c09438f66', 'de70038d-df71-4088-88cf-dad0dab039bb', 'bf307024-8734-4d0e-8c24-4acf679c85f4', '3b2d1976-9460-496c-a928-0049485853db', 'd5a46021-57bc-4ce5-a770-79e6a2983a79', '8012e1aa-9396-481c-8a5f-f0178fe489c8']","['install-windows-3.11__vucpzeT', 'install-windows-3.11__5BptGH5', 'install-windows-3.11__4cUXLgh', 'install-windows-3.11__2MuZXQ6', 'install-windows-3.11__kz7EfzC', 'install-windows-3.11__Kf7i2g8']",0,"[272.578105, 267.745773, 177.77918, 3645.10536, 1084.320907, 1165.921848]","[42.276618, 10.231451, 17.936021, 46.291957, 14.042912, 19.411312]",0.0,False,[] +claude-opus-4-1-20250805,large-scale-text-editing,9,"['3efd40f7-5f58-4f53-a526-6ecc65feed68', 'ffc9fe52-e07e-4726-a42a-94151ebf1e33', '118d8122-b389-4dae-ab44-9c4ac8e97334', 'c8b5b68b-7386-4a2c-8763-7a2078e51065', '44489547-cc5c-4603-92da-ea05b00d257c', 'e9eb0c87-6b8c-43df-8784-3b95411ad258', '3daed4e6-68fc-45d1-a338-c8a13c8c0aff', 'b9d66ccb-9b32-438c-b927-5e722433abb6', 
'05629046-aff2-4cbf-9d23-56a27678c9cd']","['large-scale-text-editing__s3YAPiR', 'large-scale-text-editing__gyq9KoM', 'large-scale-text-editing__hv4BZFE', 'large-scale-text-editing__cgnCu6w', 'large-scale-text-editing__LYTvqG6', 'large-scale-text-editing__Ydk2EAW', 'large-scale-text-editing__pUaNjry', 'large-scale-text-editing__bFbdS9q', 'large-scale-text-editing__3ZMnicF']",6,"[669.653332, 460.53846, 816.861871, 315.583443, 535.524466, 872.432357, 1526.991126, 1200.002049, 630.958542]","[11.511646, 89.917409, 22.882445, 11.671262, 13.495132, 17.004219, 61.078304, 11.465349, 358.286696]",0.6666666666666666,True,"['3efd40f7-5f58-4f53-a526-6ecc65feed68', 'ffc9fe52-e07e-4726-a42a-94151ebf1e33', '118d8122-b389-4dae-ab44-9c4ac8e97334', '44489547-cc5c-4603-92da-ea05b00d257c', '3daed4e6-68fc-45d1-a338-c8a13c8c0aff', '05629046-aff2-4cbf-9d23-56a27678c9cd']" +claude-opus-4-1-20250805,largest-eigenval,8,"['aec7d125-de2a-4b3b-926f-7e168a8c803c', 'a46e4b00-776a-41de-82f2-681a009a697f', '08aa8b62-6dfb-4abe-8dbb-a2e8d79d0bb9', '4598f8be-a0a2-458e-a31c-d59dd56154cf', '0f07f8aa-5e00-4c24-9503-1de0f62835fd', '63fba954-9d7d-4241-a98c-56f5d5b65ca6', '4dc9ff61-d034-433a-b3f2-d4d2d343f008', 'ea5c814f-e991-49a6-9c5f-8730cf12e4fe']","['largest-eigenval__bPvfRTU', 'largest-eigenval__DUkpbA7', 'largest-eigenval__5drUwQh', 'largest-eigenval__dsmuXji', 'largest-eigenval__XwcbLK4', 'largest-eigenval__YYsse8W', 'largest-eigenval__5qiANzP', 'largest-eigenval__qzw3B5n']",2,"[949.746904, 902.021514, 901.361522, 906.470496, 292.508897, 900.000739, 900.002217, 1507.487635]","[40.598477, 33.949573, 130.156763, 204.104556, 11.089038, 9.767386, 82.343406, 10.907832]",0.25,False,"['a46e4b00-776a-41de-82f2-681a009a697f', '0f07f8aa-5e00-4c24-9503-1de0f62835fd']" +claude-opus-4-1-20250805,log-summary-date-ranges,9,"['332fda31-b86e-48ec-9534-4476b6259ac2', 'c77b43a3-de6f-41f8-8500-a23196b70b3e', '00aaeee6-eb73-4c06-a1a5-5290f6acb3d7', '8969b231-a1a2-423b-815e-4bf4cf94ae76', 
'0e10cbd2-d2d5-45ea-bbfe-d51cb746b91a', 'e32f9fe1-5b8a-45be-9a7b-03e466bfe776', '60563665-81a2-4c58-9559-9e6948a1f35b', '5b16a7e3-80c6-4b7a-be8a-d47f977c7ce0', '58c6c3e7-e6f0-4623-9824-f2e8ceb587d8']","['log-summary-date-ranges__9E5k67Z', 'log-summary-date-ranges__QUu8t3u', 'log-summary-date-ranges__FiJvj5o', 'log-summary-date-ranges__Fv87mVA', 'log-summary-date-ranges__2DjT33q', 'log-summary-date-ranges__kpiN5j3', 'log-summary-date-ranges__NSUPhGa', 'log-summary-date-ranges__DCtc52a', 'log-summary-date-ranges__cPXqUyr']",8,"[82.01714, 171.94883, 295.41452, 91.415281, 87.704572, 138.376435, 160.536924, 109.058518, 106.694388]","[13.030224, 21.042713, 171.20404, 11.260408, 11.265233, 29.212379, 21.534735, 35.913269, 102.412332]",0.8888888888888888,True,"['c77b43a3-de6f-41f8-8500-a23196b70b3e', '00aaeee6-eb73-4c06-a1a5-5290f6acb3d7', '8969b231-a1a2-423b-815e-4bf4cf94ae76', '0e10cbd2-d2d5-45ea-bbfe-d51cb746b91a', 'e32f9fe1-5b8a-45be-9a7b-03e466bfe776', '60563665-81a2-4c58-9559-9e6948a1f35b', '5b16a7e3-80c6-4b7a-be8a-d47f977c7ce0', '58c6c3e7-e6f0-4623-9824-f2e8ceb587d8']" +claude-opus-4-1-20250805,make-doom-for-mips,9,"['97ecf028-b6af-45fe-b1c6-3779feb26b1a', '7f59c512-03fe-4737-9774-375f98faaf12', '15870bad-0bd8-4d33-91f3-40e29dca24a7', 'db70010f-83b4-4ed7-befe-bb8920099f7e', 'e032ad69-aba7-40f8-aee1-d6bd8a312d6c', 'c6db3522-30a1-4c34-ae7d-d1f85dc74cd7', 'f035797c-385c-4a15-a365-1927717a372c', '135617bc-1e75-4d46-a1f7-d793a1cb25f5', '7c4b329b-fcb9-4c02-b624-f14c79413f6c']","['make-doom-for-mips__X92GQCE', 'make-doom-for-mips__jZYf645', 'make-doom-for-mips__XE5P7Ro', 'make-doom-for-mips__QLTSg3g', 'make-doom-for-mips__hDoAuwU', 'make-doom-for-mips__CENTJ4d', 'make-doom-for-mips__gfp3hwA', 'make-doom-for-mips__xsJK4Ab', 'make-doom-for-mips__g2KpVkF']",0,"[901.917677, 906.140076, 926.68805, 900.000328, 900.90212, 900.001982, 900.003115, 900.024907, 900.000987]","[215.033039, 38.947822, 10.47501, 28.065174, 14.19276, 83.427916, 8.845601, 53.175365, 
10.345446]",0.0,False,[] +claude-opus-4-1-20250805,make-mips-interpreter,7,"['0f0849a5-65df-49c6-b2e3-7fd6c61f8d54', '3520488f-e4de-4191-9494-7d44164f44eb', 'd95b0ca4-5134-4a1e-b994-44f7f3fabcb1', '775c5cd7-3231-475c-9df8-285ce29f09b4', '324c3702-7add-4ca9-9e24-7acbfa13fb4b', '4742659e-e25f-4c30-9da9-928a55c4abe5', 'b376b093-070b-4b0f-bf81-05d08cac6d49']","['make-mips-interpreter__9WeXGJ2', 'make-mips-interpreter__EwaW2v7', 'make-mips-interpreter__qFdrCQP', 'make-mips-interpreter__8JyJHpk', 'make-mips-interpreter__WkKG258', 'make-mips-interpreter__9gYN3WH', 'make-mips-interpreter__UwvaqfP']",0,"[1800.001671, 1804.123265, 1800.000866, 1800.101062, 1801.350194, 2074.425933, 1815.706967]","[19.176593, 228.755224, 6.750287, 99.635532, 31.085533, 10.642213, 9.759231]",0.0,False,[] +claude-opus-4-1-20250805,merge-diff-arc-agi-task,9,"['e12bf8e9-f9f7-409e-87ff-8f5279ce8c8e', '998d54e9-c88c-4c19-93e6-258e91576be6', '51484877-d0db-4b4a-88da-c949886f9792', '73737a5a-df7a-4cfb-aa78-6e119fc6b6f2', 'b32993da-a8b6-42d7-8e0f-bfcdd006fd9e', '3fc364b4-bc33-49df-8469-ea7143b0a987', '9cf8b8a1-8103-43ff-9678-b5f38e2f9192', '5d1e7eb3-5bdd-4a30-b678-91776bc0907b', '491fea6e-e16d-489a-b98b-4b61473c3046']","['merge-diff-arc-agi-task__qZBE8G2', 'merge-diff-arc-agi-task__aKvxhs2', 'merge-diff-arc-agi-task__v62TNey', 'merge-diff-arc-agi-task__zZmnHSV', 'merge-diff-arc-agi-task__iQZAusu', 'merge-diff-arc-agi-task__rYXDDcB', 'merge-diff-arc-agi-task__7LYPySQ', 'merge-diff-arc-agi-task__N2UctBL', 'merge-diff-arc-agi-task__QPHKeGn']",3,"[217.071652, 198.706254, 473.351028, 297.197773, 917.497024, 950.452803, 905.644947, 265.488601, 905.178974]","[16.979948, 19.224254, 28.964679, 19.96496, 45.239145, 89.352401, 98.227747, 16.737375, 14.1767]",0.3333333333333333,False,"['e12bf8e9-f9f7-409e-87ff-8f5279ce8c8e', '998d54e9-c88c-4c19-93e6-258e91576be6', '73737a5a-df7a-4cfb-aa78-6e119fc6b6f2']" +claude-opus-4-1-20250805,model-extraction-relu-logits,8,"['6f998f7a-7b71-41f9-ae98-cce082d8cd38', 
'bdfb249c-9ee6-4b39-b04b-e2539ff5659a', '2edfe09c-c286-49d1-962e-efa450cccca0', 'bbbcde4e-4818-4fdd-b157-8308131ad128', '488e2534-e402-4199-a97d-8430240bca4d', 'eefad2e0-7cd5-4e46-ac53-01536000f05c', 'bdcadd99-bd58-415a-8d89-6bbaa2e9b102', 'f345537c-9e8e-4dbe-a16f-4dd271c4fb7c']","['model-extraction-relu-logits__VZEwtuD', 'model-extraction-relu-logits__aWDnoCW', 'model-extraction-relu-logits__oUiJFnv', 'model-extraction-relu-logits__rRt5kYi', 'model-extraction-relu-logits__AN3Ljim', 'model-extraction-relu-logits__ZbipMj4', 'model-extraction-relu-logits__eKQxqGh', 'model-extraction-relu-logits__RqEGASK']",0,"[266.633976, 578.998697, 182.227921, 584.547492, 156.784934, 900.009188, 440.001537, 592.310242]","[10.720606, 10.025338, 11.861693, 79.377595, 103.896455, 152.070003, 27.975216, 48.485641]",0.0,False,[] +claude-opus-4-1-20250805,mteb-leaderboard,8,"['d778b3e1-fea8-4591-85c5-1c5e30b77431', 'cdb5f530-a060-4479-acd7-63786decb16a', '59c845bf-6cb8-4d6f-83ef-5f79804aa926', 'd78235e2-f26c-426e-8a05-31ff921c5021', '544404d7-6db5-436d-8bf8-8e55f26cf8e4', '2443e660-db36-4114-9128-f562d8b33d02', 'c6deceed-6bc5-4ad7-b6dc-8e3fc4237632', '0843612c-441a-484f-8a8f-4151d2859afd']","['mteb-leaderboard__xFMgVh6', 'mteb-leaderboard__ZCSZUzy', 'mteb-leaderboard__wEkULgL', 'mteb-leaderboard__Ucz6ceM', 'mteb-leaderboard__NazcemX', 'mteb-leaderboard__obBQvwa', 'mteb-leaderboard__G2utesu', 'mteb-leaderboard__WLpeEJG']",0,"[202.93684, 97.987328, 457.663343, 116.844017, 309.443283, 405.67755, 894.546868, 353.952331]","[5.696391, 2.624427, 1.685592, 37.443775, 89.804695, 2.686064, 111.350791, 24.939464]",0.0,False,[] +claude-opus-4-1-20250805,mteb-retrieve,8,"['0220641a-d71e-4f0a-8291-a2593b84812b', '99e8d69c-0ab0-4634-80d7-8b00781584ad', 'e2f35e70-9e70-4ef9-a116-e7ac7ca5034c', '5aa1749d-6029-4ce2-aec5-ce433919311a', 'c09d888f-0f84-42af-bd81-9307a68008a2', '29bb5dda-d5ab-4de6-bda7-8c5f7fc74c9a', 'b7afad3d-dd86-4ed6-b18a-414d587b9270', 
'45fb63d0-b46d-4509-96d1-d546be30b372']","['mteb-retrieve__WqRdZRe', 'mteb-retrieve__fQAmxAb', 'mteb-retrieve__KhW77kN', 'mteb-retrieve__BBnSM4R', 'mteb-retrieve__hXv7miZ', 'mteb-retrieve__6e4xxQe', 'mteb-retrieve__XTB5dDY', 'mteb-retrieve__mhi6ZFY']",0,"[51.32253, 226.049896, 567.384364, 284.420526, 81.395991, 208.507572, 388.133686, 81.147327]","[3.58378, 28.902261, 7.417042, 28.214903, 1.745259, 2.887758, 4.886118, 3.593722]",0.0,False,[] +claude-opus-4-1-20250805,nginx-request-logging,8,"['079e5015-34b3-4245-96a2-9b06d49fb7af', 'b557d6c8-aaa1-445d-b152-788af54e5051', '962d07e7-d0f8-4c21-899a-64c2684d4d5f', '11bccd25-6a06-4148-81fe-cfc088994109', '56292ed4-7a0f-4cc3-b7bf-7df32bdee0f1', '46820140-4540-4cfc-8572-0432c2a52f2b', '0bd9dc97-39fb-44b8-81bd-e2e101ee0ac2', '27a8702b-d1da-4726-a171-bc8d243b5976']","['nginx-request-logging__U9SLcsL', 'nginx-request-logging__bx78cMk', 'nginx-request-logging__5Aams4h', 'nginx-request-logging__PzNaj7j', 'nginx-request-logging__xphabfR', 'nginx-request-logging__JFcsRpJ', 'nginx-request-logging__LwtzEzY', 'nginx-request-logging__w6ufYcx']",8,"[129.801722, 233.265661, 100.328306, 638.090941, 113.874251, 176.619626, 383.576773, 159.488286]","[11.165791, 58.475013, 11.144743, 56.830884, 14.443069, 69.973103, 42.11132, 14.520228]",1.0,True,"['079e5015-34b3-4245-96a2-9b06d49fb7af', 'b557d6c8-aaa1-445d-b152-788af54e5051', '962d07e7-d0f8-4c21-899a-64c2684d4d5f', '11bccd25-6a06-4148-81fe-cfc088994109', '56292ed4-7a0f-4cc3-b7bf-7df32bdee0f1', '46820140-4540-4cfc-8572-0432c2a52f2b', '0bd9dc97-39fb-44b8-81bd-e2e101ee0ac2', '27a8702b-d1da-4726-a171-bc8d243b5976']" +claude-opus-4-1-20250805,openssl-selfsigned-cert,8,"['521a60cb-9f6b-4c83-a43b-02f40515200d', 'ca57e394-4100-407f-bb74-c786c14b52ed', '6ae836ef-016c-4891-9b0e-f83f7f89513a', 'fe3a0b41-9395-42e0-8625-6b2ea3dffa72', '8fcb3879-147c-4629-9b41-e6ceaa3e8e95', '4e79cccb-31ed-4c37-8513-1b85cffe9dc7', 'e26d29ea-d474-4d51-bc8f-43acaeff5d38', 
'be97065c-6e2b-4566-bbca-80b37fd00ec3']","['openssl-selfsigned-cert__y9aQzQH', 'openssl-selfsigned-cert__8kUSNpC', 'openssl-selfsigned-cert__GBTjhnv', 'openssl-selfsigned-cert__9i73zwq', 'openssl-selfsigned-cert__HgRi7De', 'openssl-selfsigned-cert__NveFb85', 'openssl-selfsigned-cert__23xbRCn', 'openssl-selfsigned-cert__VqReeWv']",8,"[169.691858, 106.913432, 356.479367, 96.531413, 682.712621, 88.764477, 439.035807, 279.75366]","[26.963898, 22.364745, 47.760304, 9.77757, 113.932955, 91.187023, 88.409709, 23.736288]",1.0,True,"['521a60cb-9f6b-4c83-a43b-02f40515200d', 'ca57e394-4100-407f-bb74-c786c14b52ed', '6ae836ef-016c-4891-9b0e-f83f7f89513a', 'fe3a0b41-9395-42e0-8625-6b2ea3dffa72', '8fcb3879-147c-4629-9b41-e6ceaa3e8e95', '4e79cccb-31ed-4c37-8513-1b85cffe9dc7', 'e26d29ea-d474-4d51-bc8f-43acaeff5d38', 'be97065c-6e2b-4566-bbca-80b37fd00ec3']" +claude-opus-4-1-20250805,password-recovery,9,"['0e0a518a-f4e3-4459-be23-003886ce1e09', '364b4a60-23d4-4181-a183-b09e3bf200be', 'a8978a4e-9d89-4216-a5dd-1797f34e28e0', '060e3775-b180-4a6d-85c2-055f115ddffd', '9ac272c7-b675-438c-9fb0-0fb33578266b', '8ad142c9-01e7-46b4-9230-6c982b8e8741', 'f4c2b1da-0e84-44bc-8a9d-f5285191d55d', '59a45a77-b0fc-4bd8-8fde-4f2435ccc621', '793ee697-ef3b-4b0f-9016-e88a254d8fa0']","['password-recovery__Mf5hERr', 'password-recovery__ABKUBw3', 'password-recovery__CXb5jPU', 'password-recovery__pe9NUs3', 'password-recovery__wa6u6ak', 'password-recovery__Qw6aWcj', 'password-recovery__paaE5pf', 'password-recovery__HnYom6Z', 'password-recovery__qiFJwsj']",5,"[902.500883, 260.188883, 321.28878, 638.741134, 907.853543, 869.559788, 900.000778, 667.830922, 1666.356108]","[60.015259, 32.868132, 20.65572, 15.406862, 60.206618, 41.846468, 16.33534, 58.752535, 69.427811]",0.5555555555555556,True,"['0e0a518a-f4e3-4459-be23-003886ce1e09', '364b4a60-23d4-4181-a183-b09e3bf200be', 'a8978a4e-9d89-4216-a5dd-1797f34e28e0', '8ad142c9-01e7-46b4-9230-6c982b8e8741', '59a45a77-b0fc-4bd8-8fde-4f2435ccc621']" 
+claude-opus-4-1-20250805,path-tracing,7,"['edee0c76-d82a-46ae-957f-c8308f041175', '0746c0de-34ec-481b-b047-43df4731a485', '5978e7ea-58bd-4d7d-985d-f47af32519db', '47f85501-bf1c-4cab-9bcb-7ae60f184f2c', '65dc8e91-4011-4262-81ff-276fa36d6d43', '345e8069-8623-4b60-b391-40b3a0cb7995', '1d4e692a-7b19-48b3-8a23-e7dc8987a42f']","['path-tracing__aZ6SwDC', 'path-tracing__m2cbGad', 'path-tracing__bTxFmQR', 'path-tracing__i4kcH2D', 'path-tracing__fvi4dsu', 'path-tracing__dNkXUqR', 'path-tracing__GHhKVsQ']",0,"[1859.136666, 1800.001086, 1804.230985, 1811.064664, 977.47282, 974.599841, 969.49986]","[32.144658, 20.666943, 124.499525, 93.429658, 45.254034, 13.662253, 39.399583]",0.0,False,[] +claude-opus-4-1-20250805,path-tracing-reverse,8,"['a4493ced-0ed1-4aa5-8299-5e3459fc8484', '29d35c51-fe74-4323-afe2-47f6905decc5', '2be54584-afd4-4ae8-add6-38e332bbf922', 'bae64056-e81b-4a90-91f0-2550c3b16c62', 'ebcc6278-5a5a-44bb-9781-6921c6f38b29', '55c63350-ca20-495f-8913-fd1456b1b903', 'a6255b02-f02a-435f-ae05-d19267f26323', '7d2ac3a4-cb2d-4946-83ef-26fbd46733b9']","['path-tracing-reverse__3tmBq53', 'path-tracing-reverse__ZqkcTGH', 'path-tracing-reverse__hsTBEUG', 'path-tracing-reverse__fWWct5o', 'path-tracing-reverse__4bciBbp', 'path-tracing-reverse__AAGZGrs', 'path-tracing-reverse__Q9fQRt7', 'path-tracing-reverse__3ttux8h']",0,"[1800.000917, 1800.001767, 1810.128392, 1800.001176, 1800.032101, 1839.759531, 1809.098062, 1800.000681]","[12.131472, 17.136054, 152.392579, 42.022906, 147.094035, 91.168399, 41.444799, 14.39006]",0.0,False,[] +claude-opus-4-1-20250805,polyglot-c-py,8,"['57c2f529-8569-4f7c-a775-20eb7625dbba', 'cff297dc-7d6b-4018-b305-fc0f39d79384', '0612a6b7-c7a4-4478-873b-d3d8a36c0905', '2056f705-23a7-4bc5-9a40-e65cd1988135', '226a31d3-0056-476c-a5d3-25a53d667a34', '39e7cc9c-87a2-456e-877e-823d6b7a57c5', 'a86dab73-5d7f-40b5-846d-f55ce1e0800a', '880c4b46-6ff8-47b3-be62-85063c9f4441']","['polyglot-c-py__4dEVCBE', 'polyglot-c-py__FiUGLrH', 'polyglot-c-py__oeaesHA', 
'polyglot-c-py__KtcVadv', 'polyglot-c-py__brT9Nyr', 'polyglot-c-py__Sz7dbq8', 'polyglot-c-py__M5Z29wi', 'polyglot-c-py__iyd6Xuf']",0,"[206.43158, 181.783692, 232.122145, 823.248162, 413.786451, 138.02483, 478.509961, 527.587911]","[15.706834, 18.019086, 32.774772, 37.366635, 14.96676, 43.733409, 35.120041, 21.625336]",0.0,False,[] +claude-opus-4-1-20250805,polyglot-rust-c,7,"['b8900719-c08f-4987-a32b-10fdf84a0d7a', '674ca55c-5d16-41e2-8feb-00222cb89955', 'c89e0420-4761-467c-b267-37aedc652e7a', '7ad03ceb-6e84-452f-8bf9-d79866746e59', '6fb4566d-018c-4fa4-8a43-ce2db8257d10', '1acf53de-645b-44d6-b21a-b341b97f795c', '289ebe1c-5513-447d-b30c-4c4ccda1d500']","['polyglot-rust-c__GLwPjML', 'polyglot-rust-c__RFrbEVq', 'polyglot-rust-c__dbgrvuw', 'polyglot-rust-c__PjEoMSb', 'polyglot-rust-c__ibA3xPc', 'polyglot-rust-c__bB553ss', 'polyglot-rust-c__isLdG2D']",0,"[900.000976, 914.193253, 1007.816809, 900.002896, 900.502842, 900.685443, 931.888686]","[19.852527, 134.616231, 334.634617, 270.548061, 78.396164, 49.04118, 65.453164]",0.0,False,[] +claude-opus-4-1-20250805,port-compressor,6,"['e9b5848b-52fc-4b61-8203-242f2fde4b19', '1178f2ce-aa25-4ec5-a591-edcc4f737bdc', 'a24f81e8-ad4b-4d0f-8af9-0adf522a359e', '391e5177-45a2-4255-92a7-0b602b13533a', 'cba087b9-c691-428c-bb32-5aa41cb92bfb', 'af66c2c3-feaf-47d2-925c-2906af9af0c6']","['port-compressor__Vsrh8DJ', 'port-compressor__8qU43gs', 'port-compressor__rwuVxeD', 'port-compressor__XjVYZAP', 'port-compressor__kXMZvog', 'port-compressor__kFA6LjP']",0,"[3613.633762, 3921.859939, 3600.594592, 3633.895463, 3600.001374, 3600.040973]","[44.747803, 179.202731, 19.377769, 103.777628, 32.619792, 117.633025]",0.0,False,[] +claude-opus-4-1-20250805,prove-plus-comm,9,"['5f19aed8-745f-4ecc-a3c8-ccd641e44220', 'a65d8adf-242f-44c0-ab05-37be5a37fc1f', '82c0fa3f-e29d-4316-8519-2e2b3df4b562', '36df6a28-2cf1-4861-aa2f-08ce10a5e1d7', 'ab13dc61-78ac-4385-959a-74ca8e55d71b', '0860c205-ef2b-4e3e-8f5d-94353bd75f3f', '6a506db4-fff4-4ef8-91e8-f75521b0f3f0', 
'88a3db08-0124-4fa4-b5a2-3230e5b9b19d', '366d9ddc-1f62-46ec-b15d-321cc1672d20']","['prove-plus-comm__o2evUDT', 'prove-plus-comm__zJBJNEQ', 'prove-plus-comm__ryouz3G', 'prove-plus-comm__BuSSXDi', 'prove-plus-comm__KQGYqJy', 'prove-plus-comm__S5BE3Wt', 'prove-plus-comm__XnNXbay', 'prove-plus-comm__K78MXPU', 'prove-plus-comm__t54mGtu']",9,"[300.181889, 117.069819, 91.096263, 159.007377, 49.434102, 42.635086, 116.805302, 203.618837, 38.496605]","[60.010562, 11.201447, 24.398995, 57.080405, 14.179289, 10.968438, 38.608591, 141.514648, 12.033393]",1.0,True,"['5f19aed8-745f-4ecc-a3c8-ccd641e44220', 'a65d8adf-242f-44c0-ab05-37be5a37fc1f', '82c0fa3f-e29d-4316-8519-2e2b3df4b562', '36df6a28-2cf1-4861-aa2f-08ce10a5e1d7', 'ab13dc61-78ac-4385-959a-74ca8e55d71b', '0860c205-ef2b-4e3e-8f5d-94353bd75f3f', '6a506db4-fff4-4ef8-91e8-f75521b0f3f0', '88a3db08-0124-4fa4-b5a2-3230e5b9b19d', '366d9ddc-1f62-46ec-b15d-321cc1672d20']" +claude-opus-4-1-20250805,pypi-server,8,"['cd0ffe4c-b7b6-4827-a327-2d34d1b0b6ad', '4e117788-96a1-4cb6-b13f-6f4f89d29c5d', 'bd628078-7615-4358-b535-a3418a3ae5af', '225cdc57-9105-4e38-a05c-d0fc666c5d48', '92ee607c-d2de-4065-9f06-7aa0eb79dbf3', '2f8b3898-a48b-442d-ae15-96af001754e9', 'cafdbbf5-ede2-433a-99a2-62361ceb0346', 'd9bc6c4a-5bd7-4ee1-a032-d56d5e72a6d9']","['pypi-server__W9HTEYu', 'pypi-server__93Um2xf', 'pypi-server__XucRvop', 'pypi-server__7DaQRkg', 'pypi-server__z2FoyFw', 'pypi-server__4s6WG3u', 'pypi-server__3f4fxat', 'pypi-server__SwNJUtU']",8,"[111.040107, 290.260019, 127.156995, 245.695786, 331.972522, 152.529616, 486.381509, 189.164504]","[8.119267, 133.745448, 63.412607, 211.315672, 67.728801, 8.18225, 104.900146, 41.459755]",1.0,True,"['cd0ffe4c-b7b6-4827-a327-2d34d1b0b6ad', '4e117788-96a1-4cb6-b13f-6f4f89d29c5d', 'bd628078-7615-4358-b535-a3418a3ae5af', '225cdc57-9105-4e38-a05c-d0fc666c5d48', '92ee607c-d2de-4065-9f06-7aa0eb79dbf3', '2f8b3898-a48b-442d-ae15-96af001754e9', 'cafdbbf5-ede2-433a-99a2-62361ceb0346', 
'd9bc6c4a-5bd7-4ee1-a032-d56d5e72a6d9']" +claude-opus-4-1-20250805,pytorch-model-cli,7,"['b95dc6a4-4397-45b5-88b3-6f7579459425', '9965d685-d878-4b90-88ea-70d1a885c6ca', 'db7c15c9-a7f1-4297-8b07-ab8c56a333eb', 'bfa3ff3d-20f5-4f74-baf1-8a3eb13a3e60', 'be64ed93-47b3-4cb4-94d3-55d1b9f6da75', '7834d5ab-94f9-4788-86ae-8f87782982cc', '456e82cb-028e-40a4-b978-e5aa0e6ef84d']","['pytorch-model-cli__G2EPP4s', 'pytorch-model-cli__d4uzxdx', 'pytorch-model-cli__taMvbR5', 'pytorch-model-cli__Str9DJS', 'pytorch-model-cli__EGZWp7k', 'pytorch-model-cli__Tgz3NCe', 'pytorch-model-cli__kiGyng7']",3,"[496.116245, 191.97382, 584.181164, 638.278229, 900.510233, 494.763512, 379.893183]","[79.660132, 10.736439, 80.597106, 9.893991, 63.671566, 17.15363, 95.177207]",0.42857142857142855,False,"['b95dc6a4-4397-45b5-88b3-6f7579459425', '9965d685-d878-4b90-88ea-70d1a885c6ca', 'bfa3ff3d-20f5-4f74-baf1-8a3eb13a3e60']" +claude-opus-4-1-20250805,pytorch-model-recovery,8,"['e1f3454c-6284-4983-bfe5-99d1d71346de', 'f9abff12-4f9a-4bd6-8f18-523bff9e1f91', 'c9c3597b-0e71-44a6-a06e-f8939153956a', '395a8fdb-2b7a-48be-b3b8-859453c704cb', '5a265616-32cd-42ad-a8d4-896899dd9b88', '6a1b95d7-3235-4bcf-bf84-e3a8d67beb3f', '55714eef-d2c2-4210-ba57-a7c3728c5304', '8da9f4bf-1222-4d0a-b6fa-fc34823bf024']","['pytorch-model-recovery__2g3yKHK', 'pytorch-model-recovery__6Xh3tsK', 'pytorch-model-recovery__Dv4AYtD', 'pytorch-model-recovery__DbM8qvB', 'pytorch-model-recovery__ZCgp2bd', 'pytorch-model-recovery__vvgh8kS', 'pytorch-model-recovery__cemQoEe', 'pytorch-model-recovery__XwqPtNg']",8,"[511.260645, 900.001341, 192.191495, 235.176575, 902.330004, 902.161826, 274.897067, 309.337275]","[9.983849, 22.0232, 9.895771, 14.275868, 102.256251, 24.879071, 37.588913, 48.908343]",1.0,True,"['e1f3454c-6284-4983-bfe5-99d1d71346de', 'f9abff12-4f9a-4bd6-8f18-523bff9e1f91', 'c9c3597b-0e71-44a6-a06e-f8939153956a', '395a8fdb-2b7a-48be-b3b8-859453c704cb', '5a265616-32cd-42ad-a8d4-896899dd9b88', '6a1b95d7-3235-4bcf-bf84-e3a8d67beb3f', 
'55714eef-d2c2-4210-ba57-a7c3728c5304', '8da9f4bf-1222-4d0a-b6fa-fc34823bf024']" +claude-opus-4-1-20250805,qemu-alpine-ssh,7,"['2b0b634a-4a78-46d9-bbd5-62dc9b0efc36', 'fb214946-32fa-44de-b847-b2475aba59bd', '6be48d70-e23f-4453-a59f-1bd47017efef', 'dfe57fb1-f712-413d-a882-bbabad11d763', 'dc23566d-cd26-41f3-bbe1-27643dd3b562', '042e788b-5cbb-44b0-bbbd-de0b43132101', '538ab4e3-24e2-442f-9a5c-640189bd2e46']","['qemu-alpine-ssh__CEYpp7C', 'qemu-alpine-ssh__EGiexBr', 'qemu-alpine-ssh__ZqYhMAW', 'qemu-alpine-ssh__zQEay8s', 'qemu-alpine-ssh__EF5j68q', 'qemu-alpine-ssh__v9GKmSA', 'qemu-alpine-ssh__CuDvT6c']",6,"[287.888495, 303.443405, 452.760669, 216.84273, 289.950868, 1009.953127, 512.544333]","[10.794074, 76.408898, 1.999155, 2.230988, 9.368822, 5.487902, 23.110526]",0.8571428571428571,True,"['2b0b634a-4a78-46d9-bbd5-62dc9b0efc36', 'fb214946-32fa-44de-b847-b2475aba59bd', '6be48d70-e23f-4453-a59f-1bd47017efef', 'dfe57fb1-f712-413d-a882-bbabad11d763', 'dc23566d-cd26-41f3-bbe1-27643dd3b562', '538ab4e3-24e2-442f-9a5c-640189bd2e46']" +claude-opus-4-1-20250805,qemu-startup,7,"['1bc493ca-b967-454b-810a-8e4ea750c986', 'fc8c6c13-7325-4e9f-9801-af2bbe1f7dca', '9069b432-4864-445c-97a0-9e3bfd53b36d', '9751ac0e-851c-46aa-9285-8305f9ff064f', 'cfff69ab-a6f0-481d-9b87-b97201fe2019', '9580118a-58f2-45ae-bb53-04306b57af3a', '92d87607-8518-49f3-8a78-162038017ad1']","['qemu-startup__ZzBHbyJ', 'qemu-startup__Gd7rMRp', 'qemu-startup__SPYPwW5', 'qemu-startup__CLphKEK', 'qemu-startup__bYcNNP3', 'qemu-startup__BptfwKg', 'qemu-startup__AMHmFS4']",3,"[593.711255, 296.10671, 397.317461, 153.667311, 963.542424, 180.506271, 272.279236]","[4.392153, 9.985626, 1.767614, 2.119714, 37.000361, 26.333797, 2.91501]",0.42857142857142855,False,"['1bc493ca-b967-454b-810a-8e4ea750c986', '9580118a-58f2-45ae-bb53-04306b57af3a', '92d87607-8518-49f3-8a78-162038017ad1']" +claude-opus-4-1-20250805,regex-log,7,"['5f2aef4b-b0b8-4748-9fe2-300b50550ede', 'cec472fd-4d5a-45c9-8be9-bf71e0c16b49', 
'6f5d093d-532d-4bd3-8671-32dbd351be28', 'addd0bd5-a563-49f6-a282-6c99346f08d9', '80cbfbe0-3393-477c-a13f-21a2753d2ce5', 'b83d72b2-807e-4d72-9e83-03a2f325debc', '750995cc-8759-4aea-a1c7-08a418cde7f7']","['regex-log__vsB5abN', 'regex-log__piAvCV7', 'regex-log__eHSouqS', 'regex-log__QTPbiwS', 'regex-log__QNMXnSw', 'regex-log__WM6N83R', 'regex-log__vJyj3ew']",4,"[128.282453, 198.077775, 92.971109, 368.250988, 302.706542, 159.970616, 156.21718]","[151.259042, 238.98513, 15.870314, 32.559299, 159.250051, 21.24613, 20.624084]",0.5714285714285714,True,"['cec472fd-4d5a-45c9-8be9-bf71e0c16b49', '6f5d093d-532d-4bd3-8671-32dbd351be28', 'b83d72b2-807e-4d72-9e83-03a2f325debc', '750995cc-8759-4aea-a1c7-08a418cde7f7']" +claude-opus-4-1-20250805,reshard-c4-data,7,"['e5e25819-3c72-4a40-8beb-4a8dbc7d2eac', '68b352f1-22f0-4fcb-896a-4febdd537cc7', '41634c72-f817-4506-aa31-7e4de3ed8582', '5e8c653c-38b7-4ccd-981e-0b5df6419bbd', 'f1af89f2-a910-427c-9636-b47e1804994a', 'b786acb0-2081-4b74-9fa4-9e996d8700a5', '8d444c6a-f2de-49ed-a52c-787b1a48ef4b']","['reshard-c4-data__aQjCHFE', 'reshard-c4-data__onUF5Xb', 'reshard-c4-data__Dy29qGT', 'reshard-c4-data__u83WmzR', 'reshard-c4-data__S5N3RvJ', 'reshard-c4-data__im7VDxB', 'reshard-c4-data__ioeCi6B']",0,"[797.980871, 599.941002, 900.00652, 900.005734, 1729.501661, 294.257391, 580.075365]","[308.909622, 15.912248, 58.124409, 10.011973, 48.054598, 47.552137, 120.793836]",0.0,False,[] +claude-opus-4-1-20250805,reverse-engineering,8,"['451ba60c-f495-47a5-8934-d6d19e399f0f', '97915e07-1d7f-451b-b269-19cd05f766ea', 'c9ddcf11-fd31-42b7-8145-25d70f524a1e', '25083454-81a4-4057-8b40-deefef05a2c6', 'cee3d65f-9bd2-4b70-bb24-0a6d7ecd589b', '455c0a68-89d0-4c39-b0f6-ca8ccaf3d0fc', 'bfbb578c-3528-4b98-90a3-0c3fd270aacd', '7a68bcc8-7580-42c5-97a1-aa507493420e']","['reverse-engineering__V64KoMj', 'reverse-engineering__9yQ9SVt', 'reverse-engineering__CRddZS3', 'reverse-engineering__woBrvni', 'reverse-engineering__zgXd4mf', 'reverse-engineering__B6ej3VS', 
'reverse-engineering__EsAin8W', 'reverse-engineering__TSFQmsv']",0,"[1801.516985, 1800.238053, 1838.021957, 1895.828497, 2612.21751, 746.129547, 1802.352125, 1800.012775]","[90.526131, 74.90221, 46.263453, 7.928386, 125.993675, 30.110758, 7.461895, 110.399355]",0.0,False,[] +claude-opus-4-1-20250805,run-pdp11-code,7,"['54bd1fa0-9614-4a84-b82f-ef1c01f98a93', '89986160-f9b2-46e5-886f-ce21d6fafc20', 'ff2d32cc-c8bc-45b4-ad79-92dfc7d1eba4', '6acb8f19-5cdf-4c95-aecd-d333814cbe57', '57141c5b-894c-4a75-8e4f-067bda64fd7d', 'eacbe383-7502-40f8-abae-23c21dcbb715', 'a0031f01-6a37-4035-9c35-49eee635e5cb']","['run-pdp11-code__zj33PaA', 'run-pdp11-code__2LEHKkW', 'run-pdp11-code__69yA6r9', 'run-pdp11-code__HTjxMYR', 'run-pdp11-code__fKBHjNk', 'run-pdp11-code__Zv7FJBX', 'run-pdp11-code__24NL288']",0,"[1013.398577, 414.240595, 599.3209, 1028.544067, 507.681048, 165.716155, 565.655216]","[161.267397, 79.712215, 9.590117, 120.24924, 19.389734, 12.148019, 23.142925]",0.0,False,[] +claude-opus-4-1-20250805,sanitize-git-repo,8,"['c80ab1b4-fece-438c-bb05-c636e0237956', 'fd2b6ce1-0aa5-4571-b797-2598558a0832', '468d8c01-08f0-45ea-8cf3-e912e6067987', 'f92162b0-9993-4fa1-bdbf-6388fc8c7f6b', 'ffefb40e-0cac-40e7-8326-2664eb02b251', 'eb81fc2c-2f30-4d57-a29c-dc09b644b08c', '49d55170-3b2d-4372-a4a2-022fe29bde8e', '7f0a2b99-0418-45e8-ba35-b3a6329fc9a0']","['sanitize-git-repo__W8QYmtC', 'sanitize-git-repo__mf8A3tC', 'sanitize-git-repo__RQS5MTH', 'sanitize-git-repo__RDSMbbU', 'sanitize-git-repo__b8zYPxt', 'sanitize-git-repo__S6svTpq', 'sanitize-git-repo__8eFKziw', 'sanitize-git-repo__GFtWT6f']",0,"[903.693157, 1318.237121, 900.00212, 457.052309, 185.532736, 704.858849, 900.000792, 739.137696]","[78.382494, 231.304742, 8.456522, 17.508583, 10.57372, 79.280801, 8.391353, 22.398858]",0.0,False,[] +claude-opus-4-1-20250805,schemelike-metacircular-eval,7,"['01badb25-d302-4572-8890-cbcc60e20851', 'dce2ba82-f078-4743-b4a8-e1ac0ef5a310', 'f0a8e266-432f-44ca-a37d-b9f570968edc', 
'bfb78a1a-8f3f-4dcf-bbfa-950deb3b93b7', 'dfa56d12-ef6f-4e49-b7bc-c49bb609d8ee', 'a0bd8ecd-2a8c-4df5-a7c3-b103ee62aff2', '796334c6-e835-43f4-89f1-61f3f311ad64']","['schemelike-metacircular-eval__qZP7WcQ', 'schemelike-metacircular-eval__yLLDeAf', 'schemelike-metacircular-eval__UEP7Tpi', 'schemelike-metacircular-eval__RrqjKRb', 'schemelike-metacircular-eval__2gsbPgX', 'schemelike-metacircular-eval__WU2cktW', 'schemelike-metacircular-eval__TYucTPo']",0,"[896.959935, 2411.786063, 2407.978294, 2403.425143, 2402.266617, 2430.843741, 2400.000996]","[9.56112, 39.925977, 39.848162, 208.937125, 161.957272, 136.059493, 9.542312]",0.0,False,[] +claude-opus-4-1-20250805,sparql-university,7,"['993cd909-95ef-481f-b644-d3c46cce1840', '6cd7b1d2-35af-4397-8206-89be66f54870', '6619ff94-0e5a-4ca5-a78a-38509829de94', 'a3993ccb-771b-455f-8d62-b26d79bb7df5', 'e60beead-339e-4e52-96d0-abc7d794157c', 'aaec1464-2e89-40a3-9cd5-51bf80b9067c', 'a0a4ac18-58f9-4ee7-a142-eab0573b351e']","['sparql-university__bUtiqUh', 'sparql-university__6cfnR4z', 'sparql-university__NkR8oYC', 'sparql-university__4hECtpX', 'sparql-university__fXQ33bX', 'sparql-university__rJ6ZmUh', 'sparql-university__DhFZYX6']",0,"[217.618223, 339.613775, 265.177911, 158.460062, 199.160967, 1065.074529, 59.700205]","[18.803402, 59.212481, 100.175851, 49.516634, 46.898409, 226.11581, 17.011056]",0.0,False,[] +claude-opus-4-1-20250805,sqlite-db-truncate,8,"['c6bca54f-5b6e-407e-99d7-4cba2a003fdb', 'c1f3113e-4637-4c39-9267-d96e952c3130', 'f7dd705a-694e-4d11-95e3-53aadb3f1c91', '9eb795ae-0bc8-4eba-8d97-ce40189a1b00', '7ea95c77-9dbe-4cc8-a350-432681a3394a', '00d2059e-bc80-4347-bb40-9ff7a14e1300', '2decb33d-6acf-44cb-8ab8-12e8905f8e56', '41ec1529-01ef-41f5-b5e3-041fdb80059b']","['sqlite-db-truncate__pdqHobq', 'sqlite-db-truncate__rvxNvax', 'sqlite-db-truncate__eAXBUnU', 'sqlite-db-truncate__ZfsfpWH', 'sqlite-db-truncate__mum9gg7', 'sqlite-db-truncate__TUw3mHN', 'sqlite-db-truncate__YoJAmcK', 
'sqlite-db-truncate__AE5AqgG']",1,"[176.837932, 202.628815, 342.057067, 282.38081, 278.391312, 428.757811, 205.694099, 486.648373]","[9.82882, 34.430476, 27.987878, 42.875141, 63.221658, 58.668523, 10.589189, 77.996706]",0.125,False,['f7dd705a-694e-4d11-95e3-53aadb3f1c91'] +claude-opus-4-1-20250805,sqlite-with-gcov,7,"['79af95f8-2276-4ddc-8c39-6a015faa4b2f', '6184b94b-1597-419a-9424-f1278aaffd17', '01c15953-c7e0-404e-a07f-dae9b4ff9c2d', '47376a96-6e41-4876-b0ae-f7cd1f84e43d', '681e04ca-e202-457c-84f8-c6ebc49e9565', '96a421ff-33c8-4354-b3e4-d1f524d69d4e', '79b6aed7-befd-4e44-93b8-09d912819591']","['sqlite-with-gcov__brANnaz', 'sqlite-with-gcov__pqBojYS', 'sqlite-with-gcov__fVnVYoJ', 'sqlite-with-gcov__2GouVgG', 'sqlite-with-gcov__PffByRF', 'sqlite-with-gcov__RieZe5L', 'sqlite-with-gcov__C6idYzM']",4,"[265.550426, 162.582046, 433.157226, 221.163788, 179.5018, 523.373141, 263.510691]","[44.290131, 15.066944, 53.460916, 45.921478, 15.197928, 25.305112, 69.818562]",0.5714285714285714,True,"['79af95f8-2276-4ddc-8c39-6a015faa4b2f', '6184b94b-1597-419a-9424-f1278aaffd17', '47376a96-6e41-4876-b0ae-f7cd1f84e43d', '681e04ca-e202-457c-84f8-c6ebc49e9565']" +claude-opus-4-1-20250805,torch-tensor-parallelism,7,"['9d5422f4-bec8-404d-a9cc-0bf3c605f097', '07cbeece-e396-4b98-9ba3-fb3496789e57', 'dd72bad8-9918-415b-a0cc-c298d137d9eb', '403e777c-5c65-4e6c-b11b-4f4baf37c48f', '01abbe71-2473-4587-bb75-bfe815f7ab5d', 'c35e2f16-6867-405d-b240-2ab7d3bfe85a', '8f7f5dec-c11c-4fe9-a8e4-37d36ca0e51a']","['torch-tensor-parallelism__vSi8FiT', 'torch-tensor-parallelism__Q2GzePX', 'torch-tensor-parallelism__LKiuDMQ', 'torch-tensor-parallelism__XKSb7Gv', 'torch-tensor-parallelism__RsLnP4Z', 'torch-tensor-parallelism__JRXDeD3', 'torch-tensor-parallelism__d7zdQbY']",0,"[488.326042, 147.162879, 146.856933, 88.331873, 50.283946, 45.158359, 801.718159]","[38.202466, 40.079225, 38.959607, 49.619586, 16.419638, 15.271869, 168.605876]",0.0,False,[] 
+claude-opus-4-1-20250805,train-fasttext,7,"['1656a26b-f7fd-409f-8fd2-3ed781dcde33', 'c8ea837c-b5ca-4bf7-9929-76d1dc27719d', '3b8a6da2-13c5-4ab8-be7b-bbbf279aeae4', 'b0a394fe-201b-46a1-88b6-574265e54ecf', '8fc5545b-8b8e-4763-9d14-dea0c3e11c17', '38bcfac2-4b53-40da-911a-4a7aa19fde6e', '67392217-1422-44be-b7a7-0bc59d5142eb']","['train-fasttext__pnjWzZ7', 'train-fasttext__aUjiURS', 'train-fasttext__QSyBjQd', 'train-fasttext__jrtweNK', 'train-fasttext__PN6vqhK', 'train-fasttext__AfLxd2D', 'train-fasttext__wG3gekV']",2,"[3622.815267, 1977.492241, 3646.901448, 4868.621336, 3605.320573, 3600.000711, 2274.075464]","[57.241074, 64.63663, 20.409991, 22.578477, 28.329511, 9.529693, 14.376272]",0.2857142857142857,False,"['c8ea837c-b5ca-4bf7-9929-76d1dc27719d', '67392217-1422-44be-b7a7-0bc59d5142eb']" +claude-opus-4-1-20250805,tune-mjcf,8,"['b3461fee-2a1a-4539-b33b-5027e4ab3c9f', '0d25dc58-aca6-4096-a523-7d8af94be74e', 'af7efeb7-e8c7-4173-bc05-eb8656230d98', '3e3dcfef-6336-46bd-ace0-0cc25bb10e8a', '129b4526-38e0-42a6-a364-4abe3c127d28', 'd62fa252-d44c-4462-9afd-6b12751c39f1', '69dd84c8-9fd9-4c5c-bf16-8c9a5f840430', '8461b0ef-4b34-470b-a195-ef7d0357f164']","['tune-mjcf__r22aLEb', 'tune-mjcf__QztTAKJ', 'tune-mjcf__VUojMTf', 'tune-mjcf__7rAPFDj', 'tune-mjcf__qYJtJNA', 'tune-mjcf__sZtqC6o', 'tune-mjcf__W2hAZfo', 'tune-mjcf__tHcnv2L']",2,"[907.472763, 900.001224, 970.238686, 1008.545189, 900.009322, 245.90741, 479.479135, 900.200375]","[42.692639, 21.664388, 46.971685, 9.980842, 10.559221, 14.741623, 15.623484, 9.349886]",0.25,False,"['d62fa252-d44c-4462-9afd-6b12751c39f1', '69dd84c8-9fd9-4c5c-bf16-8c9a5f840430']" +claude-opus-4-1-20250805,video-processing,7,"['7a042abc-c91d-4be6-8d68-339839b1af36', '3e00f1f2-f771-4354-9550-ab94b95060d0', '7610a108-98fa-4b7b-9d03-415b142978eb', '4281cf11-3c02-4696-b476-ae86a49c05b4', '45085700-60c5-4a1d-bccc-c26635c6d474', 'dc54abb9-1199-4e64-a5e8-acac9461f2a2', '474fd036-e0d3-458a-b8db-33e23aecf0cb']","['video-processing__QuiJnW5', 
'video-processing__FCktrkE', 'video-processing__QwpXwiY', 'video-processing__QoAEHED', 'video-processing__HY8ZxXE', 'video-processing__ETusYP2', 'video-processing__3jniSa8']",0,"[90.555214, 298.359356, 96.72613, 337.285543, 162.099751, 345.855149, 210.560505]","[9.683292, 53.859668, 11.352564, 22.62869, 160.707156, 41.185425, 38.792506]",0.0,False,[] +claude-opus-4-1-20250805,vulnerable-secret,8,"['fe88016b-2e99-4673-bbf0-94506a64653b', '862e23e7-1faa-46ce-9977-5ad58a44800e', 'a14b0b9d-df3b-4a9d-bbd3-8305da6d1cbb', '89c27691-aeea-4d08-84c4-61e55d951d59', '02f46f7e-0aba-4caf-a7f4-c34fb818c903', 'b5b86ea0-4e39-4879-a44f-cad92cb4158f', '637d8a51-12b1-459a-8196-064f13a4e75b', '57e16a6c-7cf6-4ac5-a6da-24b99ba773b4']","['vulnerable-secret__KTpR4Gg', 'vulnerable-secret__eZpnYF5', 'vulnerable-secret__V2Y5NcA', 'vulnerable-secret__3buwUWC', 'vulnerable-secret__Bos2RBk', 'vulnerable-secret__cdgKY5Y', 'vulnerable-secret__4oFDSwW', 'vulnerable-secret__SHdYEPf']",5,"[318.515285, 900.001458, 382.275678, 972.908078, 418.521487, 78.871735, 614.719795, 900.486996]","[12.605305, 64.514706, 21.963248, 72.679368, 11.119325, 8.788546, 13.255706, 65.604878]",0.625,True,"['fe88016b-2e99-4673-bbf0-94506a64653b', 'a14b0b9d-df3b-4a9d-bbd3-8305da6d1cbb', '02f46f7e-0aba-4caf-a7f4-c34fb818c903', 'b5b86ea0-4e39-4879-a44f-cad92cb4158f', '637d8a51-12b1-459a-8196-064f13a4e75b']" +claude-opus-4-1-20250805,wasm-pipeline,7,"['f247293e-2088-4069-80d1-263a5dfec96a', '923ef369-abbd-4591-bfdd-31cd10a0af1d', '375481d8-a9a3-4aaf-b391-db02f50a686e', 'fcd0f26c-31f1-451b-b757-7eb196284dd6', '693b5606-46c3-4bfa-affc-812af6d44357', 'cf660706-c250-4052-ac98-15acccba673f', '20f8ecdd-8f35-473c-879f-4fb08321cb48']","['wasm-pipeline__StsNb6j', 'wasm-pipeline__8xRHU6G', 'wasm-pipeline__iYGi29C', 'wasm-pipeline__XZFGHd4', 'wasm-pipeline__SKjUzGE', 'wasm-pipeline__GxfHuNs', 'wasm-pipeline__DutK98q']",1,"[224.428482, 355.818902, 774.733994, 238.562136, 900.002479, 319.873497, 312.943763]","[8.031601, 20.290195, 
14.102035, 1.675604, 2.057794, 4.476901, 5.38346]",0.14285714285714285,False,['fcd0f26c-31f1-451b-b757-7eb196284dd6'] +claude-opus-4-1-20250805,winning-avg-corewars,6,"['df842bec-2878-45f0-a123-7a8a5132dd70', 'b9509375-fdf5-4f21-b8ce-6fcf3c767742', '13a8e061-4a0f-4183-95fb-28fc4783fc64', 'f1c98275-ca46-489c-9643-8f4889df9e67', '3366ff69-5908-47e2-be01-e1c302821e48', '3a8d151e-ffac-43d4-8e25-f1e9c3240654']","['winning-avg-corewars__vUpVCiW', 'winning-avg-corewars__F3TaAEa', 'winning-avg-corewars__ektyjys', 'winning-avg-corewars__E7yaKUU', 'winning-avg-corewars__cQC4enF', 'winning-avg-corewars__hXPdgSA']",2,"[3628.171085, 4698.226795, 3600.003512, 3600.148603, 242.722011, 951.561942]","[15.9994, 1.900767, 3.564611, 4.124479, 29.296188, 83.284305]",0.3333333333333333,False,"['3366ff69-5908-47e2-be01-e1c302821e48', '3a8d151e-ffac-43d4-8e25-f1e9c3240654']" +claude-opus-4-1-20250805,write-compressor,7,"['2ee94be4-7881-45ac-a7a1-41a61464b228', 'cdb4125b-aab0-4e5b-ae65-d04645d202ff', '385d4f26-dc27-4699-b932-3d2166191eb9', '338b1c84-067f-4fd9-b8ec-fb8eace91e00', 'bddd6888-8633-4b27-aa57-3a331a7ff544', '1fa04da8-c87c-4ea9-8e91-f0686cb9f198', 'df4c9379-4877-41dd-9e37-8c26621bd71c']","['write-compressor__DXukyP9', 'write-compressor__vfM5ucN', 'write-compressor__pvo6dUy', 'write-compressor__k2CoczV', 'write-compressor__FDVAYZG', 'write-compressor__WCGQKBk', 'write-compressor__MFoGYm5']",0,"[911.137481, 900.00478, 1416.71387, 900.52265, 931.172761, 1261.303716, 910.186991]","[88.205348, 17.444636, 26.236, 25.811638, 65.172512, 26.070066, 119.771209]",0.0,False,[] +claude-sonnet-4-20250514,adaptive-rejection-sampler,5,"['9233f01e-96b1-475e-bdc5-99459abc838a', '39233179-868d-403a-8e48-6fbe668b79d9', '54ebaaa4-3ab0-4a84-b723-52034a84757c', 'd56cf36a-2b54-4729-9e7c-aa87f9276475', 'fc0a5e9f-368d-4891-a92e-05b6193c4e66']","['adaptive-rejection-sampler__V8M9s78', 'adaptive-rejection-sampler__oQpLftn', 'adaptive-rejection-sampler__BEqx7U2', 'adaptive-rejection-sampler__7nypC6s', 
'adaptive-rejection-sampler__ohYbsqv']",0,"[913.14035, 900.046848, 900.005874, 780.211017, 906.989604]","[31.135203, 62.788335, 54.975925, 70.168473, 48.325161]",0.0,False,[] +claude-sonnet-4-20250514,bn-fit-modify,5,"['58c69ea6-265a-459c-a770-dca1ef81a615', '07cc1a7c-2b8e-43a8-b6ae-4236a0062451', 'dbf4a7b2-52ab-4ef6-8f54-b82966dd3bc8', '730e39b6-628a-434f-8c44-e2df076c5ed4', '6938d6ee-21ab-4e2c-ab37-99a16aee4b9c']","['bn-fit-modify__x5uqEGR', 'bn-fit-modify__avU2ktZ', 'bn-fit-modify__aqQwQFs', 'bn-fit-modify__nbJopyP', 'bn-fit-modify__dfkro3Y']",4,"[820.136814, 644.112219, 2270.286565, 806.876033, 529.07358]","[171.963578, 68.982205, 15.12867, 70.129608, 21.518367]",0.8,True,"['58c69ea6-265a-459c-a770-dca1ef81a615', '07cc1a7c-2b8e-43a8-b6ae-4236a0062451', '730e39b6-628a-434f-8c44-e2df076c5ed4', '6938d6ee-21ab-4e2c-ab37-99a16aee4b9c']" +claude-sonnet-4-20250514,break-filter-js-from-html,5,"['ef387938-4766-4702-ba44-0f1eed497cb2', '94bcdadf-25b2-4e47-8082-25ed7da15410', 'c4655063-bd02-42e0-9495-a74111a73a7e', '1e1257c2-0bc8-4762-881e-cf7fab034b48', '7aa22908-352c-455e-90ea-03d2da162882']","['break-filter-js-from-html__BZG266D', 'break-filter-js-from-html__8vWY4c2', 'break-filter-js-from-html__5dPJGuo', 'break-filter-js-from-html__26SQbmP', 'break-filter-js-from-html__qyKoPYs']",0,"[1201.584268, 1200.644363, 1203.851562, 1220.919695, 1204.815957]","[99.385173, 100.319438, 24.853214, 16.093682, 23.43454]",0.0,False,[] +claude-sonnet-4-20250514,build-cython-ext,5,"['1e869927-ca46-4089-b477-ae0e1573a940', 'ba4093ff-7655-40e2-9944-624782ad7916', '38b13cb1-e61d-4bd8-9b43-74c953ab9a22', 'd38d3fba-f8aa-4c1d-8c26-cd660d664238', '2cacddc9-541f-486d-bbf7-d2e3e9a14136']","['build-cython-ext__ErZsvV9', 'build-cython-ext__P2EA2Pe', 'build-cython-ext__c5YjzjK', 'build-cython-ext__dn7U2dq', 'build-cython-ext__b7CVVHe']",0,"[904.529451, 649.676938, 900.001076, 900.255359, 954.120021]","[47.889727, 211.786067, 39.306758, 9.133693, 129.950697]",0.0,False,[] 
+claude-sonnet-4-20250514,build-initramfs-qemu,3,"['27e63949-b341-40ff-b23e-77f3766addd3', '00377d41-cba4-44ff-b3d8-51866886ea96', 'e1e03b63-fe0d-47df-9b7b-3f4195ecd59e']","['build-initramfs-qemu__n5nem6t', 'build-initramfs-qemu__S4gwPsV', 'build-initramfs-qemu__6cBk5PD']",0,"[191.329906, 986.848407, 980.620983]","[16.8998, 29.974979, 22.764854]",0.0,False,[] +claude-sonnet-4-20250514,build-pmars,5,"['cda59b89-db78-4d9e-b12d-dbff945f4f53', 'aae8953f-6f75-4525-81d3-57317d7c935d', '07014b77-ca2a-49a1-853e-6a308973fa3c', 'c3130136-d5b3-4e6c-927c-b0a70c24d317', '9804fe7c-92d8-4761-b3e0-1c95efcedc94']","['build-pmars__v5ZqmTB', 'build-pmars__ezsi9hM', 'build-pmars__6iTCCBp', 'build-pmars__fBdz9cX', 'build-pmars__Y8x4ye6']",3,"[787.088101, 903.979358, 2066.811023, 314.732475, 432.533148]","[15.71523, 42.350568, 11.400012, 5.198745, 5.632364]",0.6,True,"['cda59b89-db78-4d9e-b12d-dbff945f4f53', 'c3130136-d5b3-4e6c-927c-b0a70c24d317', '9804fe7c-92d8-4761-b3e0-1c95efcedc94']" +claude-sonnet-4-20250514,build-pov-ray,5,"['b5e1b4c6-a8a3-4df9-8281-0b7b984fd07e', '688b62d2-8ddc-487e-b255-1b7c21b5d432', '68ecacf5-967f-4103-bb31-76686db36f44', '71928e96-c486-4790-8d04-2a14cf0a44ac', '9ea2f631-50b2-41fc-becb-fc67a783caf8']","['build-pov-ray__ref9cqZ', 'build-pov-ray__S9TdbpK', 'build-pov-ray__ctzqG6C', 'build-pov-ray__wSwMHKs', 'build-pov-ray__q9WDS9V']",3,"[828.924243, 1843.132151, 1883.394436, 2059.80543, 1275.507878]","[16.024816, 99.723079, 56.89661, 103.062513, 24.101326]",0.6,True,"['b5e1b4c6-a8a3-4df9-8281-0b7b984fd07e', '688b62d2-8ddc-487e-b255-1b7c21b5d432', '9ea2f631-50b2-41fc-becb-fc67a783caf8']" +claude-sonnet-4-20250514,cancel-async-tasks,5,"['fc085ff4-1ecf-4dd6-bdc6-a537e278afda', '7b3b5676-7179-4f92-8fa1-f669f91354c2', 'f17520ad-0263-46b5-b001-99fd9003db9c', '96560608-d32c-4317-96fd-0db05f68b7ff', 'd2fa32bd-4c64-4b4d-b159-2cf3daf2b5e4']","['cancel-async-tasks__ZFwgBV5', 'cancel-async-tasks__vpPjvn5', 'cancel-async-tasks__gCKNPnV', 'cancel-async-tasks__nmbgWWb', 
'cancel-async-tasks__oDmWLcX']",4,"[160.756635, 857.03885, 214.053384, 429.56147, 130.056178]","[61.478621, 336.117733, 136.913079, 45.839497, 50.528687]",0.8,True,"['fc085ff4-1ecf-4dd6-bdc6-a537e278afda', '7b3b5676-7179-4f92-8fa1-f669f91354c2', 'f17520ad-0263-46b5-b001-99fd9003db9c', 'd2fa32bd-4c64-4b4d-b159-2cf3daf2b5e4']" +claude-sonnet-4-20250514,chess-best-move,5,"['de6ed5ff-979b-4f3c-99af-c85672494188', '108d5a4c-f6b6-4102-be4b-cfd5930c70ff', '48d37d5e-21b1-4335-a68d-9240069cc0a0', '9c192dbc-56df-4298-91be-9eb1866eebd6', 'f18235ff-1fd3-4b74-af46-28fe7cffa977']","['chess-best-move__nuJrYJD', 'chess-best-move__7HwHg66', 'chess-best-move__KDAhDWv', 'chess-best-move__NJJiib8', 'chess-best-move__P6iHHwc']",0,"[182.596906, 369.575414, 301.786249, 765.37166, 747.189363]","[7.909109, 15.353643, 13.506449, 25.135517, 17.304362]",0.0,False,[] +claude-sonnet-4-20250514,circuit-fibsqrt,5,"['3db7084b-51c4-4a32-831b-8e7fb7b7d3e7', '2f25a9ef-f508-4fdb-9826-0e0c442de532', 'f599bdca-c5f5-49a6-95c1-14a4a6ecbc66', '66acf2b0-01fb-44de-a29c-d1f341c79995', '5852e644-02a5-4a15-b7bc-86af6e464aa1']","['circuit-fibsqrt__4yRsZzm', 'circuit-fibsqrt__j8C2qt5', 'circuit-fibsqrt__oPPNuMe', 'circuit-fibsqrt__GWyXg7X', 'circuit-fibsqrt__VfBVHar']",0,"[1484.809645, 3593.166055, 3129.493289, 1212.977427, 1840.893847]","[12.666521, 38.987011, 56.007695, 78.345242, 46.838298]",0.0,False,[] +claude-sonnet-4-20250514,cobol-modernization,5,"['207b7983-33b7-4300-a546-111d3aaeda87', '92bebbe6-466e-40b7-ad70-6e3ad01a9e1c', '3cae6dcf-5752-485a-8f64-9504aaa65a79', '55fa376c-6a82-481a-9290-ae8db06fb526', '4f9ed2f7-68ac-4fb6-870e-92fb9a0b232f']","['cobol-modernization__zr7S5jC', 'cobol-modernization__Vr5PVKx', 'cobol-modernization__sDpGtJC', 'cobol-modernization__PN8oucw', 'cobol-modernization__xszWcus']",5,"[640.959331, 900.524519, 900.438976, 429.120695, 421.664031]","[104.074538, 120.417231, 36.030679, 50.195178, 12.681898]",1.0,True,"['207b7983-33b7-4300-a546-111d3aaeda87', 
'92bebbe6-466e-40b7-ad70-6e3ad01a9e1c', '3cae6dcf-5752-485a-8f64-9504aaa65a79', '55fa376c-6a82-481a-9290-ae8db06fb526', '4f9ed2f7-68ac-4fb6-870e-92fb9a0b232f']" +claude-sonnet-4-20250514,code-from-image,5,"['66d7d325-0c65-4beb-aec6-e109d97d67e9', 'd6d3c95f-e1b7-4755-9b50-928646599244', 'f9411475-ddb3-4b2b-989e-8e98f3f1ecf3', 'd83d993e-0600-4854-b8d2-213ce62d19ff', '7532947f-61e9-4afd-96b1-63fa5afef698']","['code-from-image__khpGPNE', 'code-from-image__gAZY2Xc', 'code-from-image__pjHFtfn', 'code-from-image__6hfGGSH', 'code-from-image__KsTD5Qf']",1,"[347.249671, 595.062854, 536.517756, 502.339511, 1233.638751]","[21.701877, 15.852382, 88.367477, 150.887184, 45.840111]",0.2,False,['f9411475-ddb3-4b2b-989e-8e98f3f1ecf3'] +claude-sonnet-4-20250514,configure-git-webserver,5,"['e099d492-f6ab-4df8-9335-3911ab79927c', '6cdfd015-430d-4038-a4d0-a40c82d16fd2', '8838b73f-5c99-439a-b254-f32398a23712', '84edd2dc-c29d-4987-b092-a7702cd0a6db', '0f5d9b94-364b-448d-a937-dbd0629b05b1']","['configure-git-webserver__WMQocS2', 'configure-git-webserver__mPsN8oC', 'configure-git-webserver__wJiZidw', 'configure-git-webserver__sSCFwz8', 'configure-git-webserver__WBodEQK']",3,"[741.377653, 513.829686, 411.967293, 869.832717, 786.889597]","[40.703094, 91.247002, 21.881356, 100.605039, 60.32331]",0.6,True,"['e099d492-f6ab-4df8-9335-3911ab79927c', '8838b73f-5c99-439a-b254-f32398a23712', '0f5d9b94-364b-448d-a937-dbd0629b05b1']" +claude-sonnet-4-20250514,constraints-scheduling,5,"['f7ca3fe2-4ea0-406b-8f53-d01482eb21fe', '122dedad-0280-4369-84f9-8a805cf13c94', '1eb170f7-f27f-4f59-b7a7-2927e1ce68c8', 'b5323013-0018-4c91-95af-42a8586c897e', '426c4365-5cf9-4b6b-8529-2c294aebdd07']","['constraints-scheduling__tPRZNfF', 'constraints-scheduling__87ApYPw', 'constraints-scheduling__EndPv3o', 'constraints-scheduling__nhk48MC', 'constraints-scheduling__3nuZC39']",5,"[290.927141, 818.115168, 477.372967, 441.858093, 403.9593]","[14.653464, 116.667374, 75.460235, 58.982023, 
100.455927]",1.0,True,"['f7ca3fe2-4ea0-406b-8f53-d01482eb21fe', '122dedad-0280-4369-84f9-8a805cf13c94', '1eb170f7-f27f-4f59-b7a7-2927e1ce68c8', 'b5323013-0018-4c91-95af-42a8586c897e', '426c4365-5cf9-4b6b-8529-2c294aebdd07']" +claude-sonnet-4-20250514,count-dataset-tokens,5,"['bc06179e-f63f-4b42-8e3d-517056c0f246', '09f3ed25-7b78-415f-88d1-6a34fcd57659', 'ac7092e1-59c8-4211-a7e5-0f0068280fc1', '3d46f0d9-7f95-42c8-8daa-6a115909702e', '7a156489-ea08-4fc5-9b15-b169c9fde7cf']","['count-dataset-tokens__pEgtwqP', 'count-dataset-tokens__VbmyvNp', 'count-dataset-tokens__vUM9CHm', 'count-dataset-tokens__g9XjJod', 'count-dataset-tokens__dBx7rQk']",0,"[903.145696, 870.010049, 326.745536, 850.169258, 708.12527]","[79.608784, 35.593887, 8.17123, 38.611983, 27.664808]",0.0,False,[] +claude-sonnet-4-20250514,crack-7z-hash,5,"['3efbef34-1841-4433-be94-a61b3662bc3a', 'c5d3d342-c9fb-45e8-b6c9-7112ff160da8', '253fc76a-b10c-409c-84a9-307abcb25b2c', '3fd05fe6-3ed3-4822-ad45-07c328c4d8d7', '00b3868a-38bf-42c8-bb15-d45f22f48f65']","['crack-7z-hash__TNUhMme', 'crack-7z-hash__PPHHNKe', 'crack-7z-hash__egrrJcP', 'crack-7z-hash__NsqSJAU', 'crack-7z-hash__LErBRwb']",5,"[488.225367, 664.830349, 454.122763, 342.291987, 411.545471]","[15.21892, 17.542364, 31.628644, 37.642892, 10.647186]",1.0,True,"['3efbef34-1841-4433-be94-a61b3662bc3a', 'c5d3d342-c9fb-45e8-b6c9-7112ff160da8', '253fc76a-b10c-409c-84a9-307abcb25b2c', '3fd05fe6-3ed3-4822-ad45-07c328c4d8d7', '00b3868a-38bf-42c8-bb15-d45f22f48f65']" +claude-sonnet-4-20250514,db-wal-recovery,5,"['fb27d323-5f8d-455e-adb1-98ff41cc4828', '16a1bfd6-e77b-4579-9d5e-9f0244a6b98e', '8fbbaa08-b3b9-4621-a646-91e8e6ff4818', '94aeadb8-7ef8-464c-9e36-42b9da372884', '1c3ba781-ef0d-4307-88be-4a47b29dd401']","['db-wal-recovery__f74zoZq', 'db-wal-recovery__uJDtAbj', 'db-wal-recovery__7BZiXGP', 'db-wal-recovery__dbNBvZ3', 'db-wal-recovery__6sa5TuE']",0,"[862.900372, 1024.431353, 941.266466, 261.830652, 307.527053]","[24.311253, 73.305063, 55.937318, 14.140732, 
6.2269]",0.0,False,[] +claude-sonnet-4-20250514,distribution-search,5,"['56c6266f-c920-4be4-9ef4-4f59c5c66f0f', '69c34280-4a18-4f7d-996f-adaf65ee29ba', '6af7418d-3806-44ee-908d-4dba724d2eb3', '81866dec-0a7b-41b9-b34d-da7dbe0715a4', 'a83280f5-c068-456a-846a-06fc405c4110']","['distribution-search__Jkb8C2u', 'distribution-search__33crLei', 'distribution-search__7ogquUx', 'distribution-search__4xEB7Vb', 'distribution-search__CAV4WkY']",3,"[1126.075232, 1073.153483, 620.658975, 741.668815, 554.83574]","[206.596974, 50.136908, 136.878899, 8.503073, 27.124071]",0.6,True,"['6af7418d-3806-44ee-908d-4dba724d2eb3', '81866dec-0a7b-41b9-b34d-da7dbe0715a4', 'a83280f5-c068-456a-846a-06fc405c4110']" +claude-sonnet-4-20250514,dna-assembly,5,"['d71d756f-35c9-4f9f-99a4-f17d2dc0ccd6', '32853f59-59e8-42ae-acd8-6ef1cfb2e82d', 'e8de320d-ce85-4649-b046-e500b7fe7cfc', 'd9be9628-abe8-4272-80c1-b785230e27fa', 'e3cfd3b3-4453-46a4-836c-d8bdec71a9ff']","['dna-assembly__a25jLMr', 'dna-assembly__pPSepJd', 'dna-assembly__4jqqtQt', 'dna-assembly__zEFvCY4', 'dna-assembly__589vDjz']",0,"[720.023391, 735.313826, 748.965164, 755.008952, 777.460307]","[53.632032, 66.296488, 30.588696, 32.628623, 84.167023]",0.0,False,[] +claude-sonnet-4-20250514,dna-insert,5,"['d416f3de-255b-485a-a1c0-3bbbcb6a9ee1', '4fa68048-81b8-4d1c-bdf6-1f9498e5435b', '19d8c536-6f18-4fa9-913f-ae2fc6de081b', '549774d0-43cc-4e20-81f3-d865a384156d', '5271a0fb-d8d5-441d-9857-b2a21985fe9a']","['dna-insert__HerjgLC', 'dna-insert__gwjwuDk', 'dna-insert__zLTyCsq', 'dna-insert__fKCD7ni', 'dna-insert__KbAZEpD']",0,"[365.448887, 360.095015, 376.229573, 360.637374, 502.79937]","[52.604157, 26.409285, 16.413359, 29.431134, 50.409538]",0.0,False,[] +claude-sonnet-4-20250514,extract-elf,5,"['c32a6678-a974-4a8c-82c0-8a9a3c702bf2', 'fbed5025-a81d-4502-9017-527a16222baa', '7e161c6e-d4cf-4053-b3d8-6175596e50be', 'a72f974b-b3d7-4dab-b976-6195c30a5d43', 'd888aa36-01b0-4d0f-b388-ed48d1ee41a5']","['extract-elf__3CkY7Co', 'extract-elf__kTzLSev', 
'extract-elf__3yz5rMD', 'extract-elf__b5n87Yv', 'extract-elf__GCqpsuE']",1,"[629.764203, 262.716691, 378.624993, 324.353545, 851.343673]","[59.779327, 19.733007, 96.609083, 18.047497, 53.139864]",0.2,False,['d888aa36-01b0-4d0f-b388-ed48d1ee41a5'] +claude-sonnet-4-20250514,feal-differential-cryptanalysis,5,"['852515e7-ae0c-45f5-92cc-064f9907e77f', 'f02f5826-1638-4464-aa0e-4b7d551c05cd', 'ec4dcdd3-8707-4b40-8d23-c33b6968810a', '05b61be6-aea8-4ff2-8c72-680cbb811d9b', '8c817bdf-e271-409e-ac30-a0178c7455bb']","['feal-differential-cryptanalysis__tKHPbet', 'feal-differential-cryptanalysis__pinr4Qx', 'feal-differential-cryptanalysis__jSRRKpV', 'feal-differential-cryptanalysis__YywVs83', 'feal-differential-cryptanalysis__qQNv6eK']",0,"[1807.219773, 1807.815899, 1800.00256, 1816.288025, 1386.949371]","[42.784474, 48.745629, 13.890039, 108.301513, 12.740045]",0.0,False,[] +claude-sonnet-4-20250514,feal-linear-cryptanalysis,5,"['0d9ebbae-d083-4cab-b55e-e8c42ab9fddb', 'ef7ae628-13fc-4d17-bcf2-69199b854edf', '95173a80-8a32-49d7-86ae-5cff8fadef75', '6e47495f-ed54-4bc7-b158-cb6f94028488', '605dbc0e-1ad7-4eae-908c-c88d4ed19720']","['feal-linear-cryptanalysis__o6BdcYN', 'feal-linear-cryptanalysis__uuJHbeB', 'feal-linear-cryptanalysis__QvVtCUT', 'feal-linear-cryptanalysis__qsPpVLM', 'feal-linear-cryptanalysis__nJBAGRg']",0,"[1800.001266, 1800.015578, 1800.008542, 1802.770913, 1800.68162]","[12.590332, 298.830892, 82.014467, 22.802394, 47.494369]",0.0,False,[] +claude-sonnet-4-20250514,filter-js-from-html,5,"['25626d83-ea6e-455d-ae88-70deb2dccd90', '9af0b005-a364-4e67-822f-8c7e23911e9f', '65f195a6-067f-4ba5-a867-9106500f4a41', '2b66e04a-d5f0-478a-bdbc-31fabcb68731', '92a32cb3-09d6-4401-96d0-e3a3d278681c']","['filter-js-from-html__v5TfLpw', 'filter-js-from-html__7LBBDWd', 'filter-js-from-html__jpHGjER', 'filter-js-from-html__JsAFkvq', 'filter-js-from-html__PSjBBL2']",0,"[515.436418, 755.653321, 901.335032, 490.116923, 413.173615]","[34.625291, 40.613384, 134.747083, 16.720031, 
105.212741]",0.0,False,[] +claude-sonnet-4-20250514,financial-document-processor,5,"['26170339-13cd-4381-b254-c1d8ba1b4175', '5b30fff9-c502-48f3-a49a-859a5626461c', '59b5f829-1e37-4cd7-9f05-8ee6c1d89995', '8aa1f7e6-dbb8-4c35-87dc-7e2d63266444', '734e9b56-2e9d-4c27-9af3-318675ed0f80']","['financial-document-processor__Nwhubsc', 'financial-document-processor__649MisF', 'financial-document-processor__GrcymQW', 'financial-document-processor__sYuea85', 'financial-document-processor__SU6xtEh']",1,"[597.356623, 740.840784, 486.849086, 1027.384662, 1230.753223]","[21.443907, 247.092878, 20.148235, 54.37779, 301.963744]",0.2,False,['26170339-13cd-4381-b254-c1d8ba1b4175'] +claude-sonnet-4-20250514,fix-code-vulnerability,5,"['e0f3f922-f08a-469c-80fb-5e82048becd7', '4c533f4a-105b-4c41-b46f-beb7acf237b4', '0a84d848-147e-48f2-902d-b1a172df3b38', 'f559401c-c22f-43a9-ba03-1ab5a3a21e6c', 'ef2b94f2-8c1a-4541-9c6f-0d5dead5dca1']","['fix-code-vulnerability__EcmGxLG', 'fix-code-vulnerability__bRJz23Y', 'fix-code-vulnerability__Qj8rBPj', 'fix-code-vulnerability__hicMAf3', 'fix-code-vulnerability__5gcLQnP']",4,"[902.056481, 497.827049, 760.944782, 948.347104, 801.179318]","[20.864785, 4.531081, 58.790038, 17.48536, 73.76278]",0.8,True,"['e0f3f922-f08a-469c-80fb-5e82048becd7', '4c533f4a-105b-4c41-b46f-beb7acf237b4', '0a84d848-147e-48f2-902d-b1a172df3b38', 'ef2b94f2-8c1a-4541-9c6f-0d5dead5dca1']" +claude-sonnet-4-20250514,fix-git,5,"['d274f36f-cbc1-4837-b9da-0e41efd61101', '30ca15c5-20ba-4359-82b9-bc846cbb8d77', '62f43f2d-b0ba-4951-a283-26a4aa00e494', '54b89816-ca4e-4d5a-af6a-79b687fc8ddb', '3d7bd1b7-12e7-4b8f-b0ab-1977776a81e2']","['fix-git__wZBE3Uj', 'fix-git__BPfZiSp', 'fix-git__Na6Ztyw', 'fix-git__fSxB26X', 'fix-git__5FCW52Z']",5,"[103.529054, 275.255393, 480.673688, 199.990105, 184.343923]","[24.887904, 103.998099, 34.013296, 19.013792, 38.224772]",1.0,True,"['d274f36f-cbc1-4837-b9da-0e41efd61101', '30ca15c5-20ba-4359-82b9-bc846cbb8d77', '62f43f2d-b0ba-4951-a283-26a4aa00e494', 
'54b89816-ca4e-4d5a-af6a-79b687fc8ddb', '3d7bd1b7-12e7-4b8f-b0ab-1977776a81e2']" +claude-sonnet-4-20250514,fix-ocaml-gc,5,"['d5039454-20af-4a8e-8045-2c85406377ca', 'b01af900-ff04-4e4a-b965-3b825a949c84', 'ee5a7b12-ec19-449f-9741-a330a8f0aff8', 'ef49ec7b-fc99-4196-acbf-87725925b51c', '0d593502-a027-415c-bfc6-71412ce4999a']","['fix-ocaml-gc__ur7hxpz', 'fix-ocaml-gc__CCMVpCT', 'fix-ocaml-gc__PvBaBwA', 'fix-ocaml-gc__SFXKcAN', 'fix-ocaml-gc__XXRV24a']",0,"[1277.170482, 3611.41212, 3604.199857, 3600.63477, 3837.073705]","[262.958628, 81.892925, 60.459387, 23.954189, 33.608073]",0.0,False,[] +claude-sonnet-4-20250514,form-filling,5,"['4d9729b9-11c3-47ff-9a6a-cc1b6581cd8a', 'f8150528-fc88-4b6f-969c-3069167190be', 'c0eedf95-ceef-4ea6-bffd-d425cc841585', '25b4e369-a625-4567-8011-07a293e34937', '5f234901-445e-482f-8ce2-e9e2a082a74c']","['form-filling__sgF7hUb', 'form-filling__o93iSiX', 'form-filling__iWMEA34', 'form-filling__QSkTKKa', 'form-filling__GqSKnGb']",5,"[417.172156, 637.550871, 277.06691, 423.387936, 338.867321]","[16.266752, 12.655206, 4.871517, 9.89, 58.162026]",1.0,True,"['4d9729b9-11c3-47ff-9a6a-cc1b6581cd8a', 'f8150528-fc88-4b6f-969c-3069167190be', 'c0eedf95-ceef-4ea6-bffd-d425cc841585', '25b4e369-a625-4567-8011-07a293e34937', '5f234901-445e-482f-8ce2-e9e2a082a74c']" +claude-sonnet-4-20250514,git-leak-recovery,5,"['5828f51b-7e9a-49c5-95cb-5975c95a317c', '5623a04b-13fa-490d-9942-b03ff68ac1fc', '374a8aba-7613-4678-834c-bd7638170198', 'fe619032-d2c6-46a8-874e-469faedd2136', 'e7590a6a-2c16-4cf1-8cdb-6579359fd3c0']","['git-leak-recovery__H4HHTaR', 'git-leak-recovery__Z7DhaQt', 'git-leak-recovery__YEPGUiT', 'git-leak-recovery__KAcySGP', 'git-leak-recovery__4RnTgEu']",5,"[376.98746, 389.821232, 519.911198, 307.443792, 242.261075]","[53.745698, 51.92641, 48.700533, 57.750853, 30.339853]",1.0,True,"['5828f51b-7e9a-49c5-95cb-5975c95a317c', '5623a04b-13fa-490d-9942-b03ff68ac1fc', '374a8aba-7613-4678-834c-bd7638170198', 'fe619032-d2c6-46a8-874e-469faedd2136', 
'e7590a6a-2c16-4cf1-8cdb-6579359fd3c0']" +claude-sonnet-4-20250514,gpt2-codegolf,5,"['62f72753-02e1-47af-86e8-bd5c5d7e673f', '75d55ff2-8385-41a2-9b13-8a4bd3202062', '5efd346c-fef8-45e6-ba8e-158bf0485231', '08c4ae76-62af-48ac-bdaa-a03318c56d41', '710a23fd-d90c-4c94-bf0b-71fdcc11b68c']","['gpt2-codegolf__sBz7epP', 'gpt2-codegolf__ZyrZ4dr', 'gpt2-codegolf__8TBYpq5', 'gpt2-codegolf__S8683WD', 'gpt2-codegolf__m9vkX5X']",0,"[727.244777, 652.226257, 900.264474, 901.220506, 900.08802]","[28.89851, 222.366132, 67.42623, 35.564094, 117.353696]",0.0,False,[] +claude-sonnet-4-20250514,hf-model-inference,5,"['8d6e1a2c-550d-4f42-9d43-32e0532a60da', 'c1229020-7a50-449c-9bee-8a594898cfa7', '352afbf5-0d59-4617-a582-051cc17a0b21', 'd8e1bb84-c799-4a3c-82a5-7df1b83bcf42', 'dba1d7ec-2b63-4c1c-8a97-582055238660']","['hf-model-inference__Nq6Hszo', 'hf-model-inference__XDQTbv2', 'hf-model-inference__DWdk24C', 'hf-model-inference__YZe8Avc', 'hf-model-inference__S4hHiXX']",1,"[509.279584, 957.470013, 451.788547, 528.661928, 326.045056]","[48.183553, 31.011411, 57.660114, 29.27602, 79.463982]",0.2,False,['c1229020-7a50-449c-9bee-8a594898cfa7'] +claude-sonnet-4-20250514,install-klee-minimal,5,"['7997bee2-7b52-44ff-b829-eb4530aa2361', '05446873-ba91-483b-a235-2e70ce73e0b3', 'fd017dcc-4847-4433-8af4-9d825bb8dfb5', '121ff17a-15ac-43eb-bf32-79cb28c00cee', '9a8d8649-b56b-4fa3-b28b-00958cba7054']","['install-klee-minimal__xtoytZM', 'install-klee-minimal__5T2Eis6', 'install-klee-minimal__rAfnvND', 'install-klee-minimal__Zo4ikwX', 'install-klee-minimal__UQFoKXx']",0,"[900.559529, 900.508385, 900.292791, 903.034968, 900.070444]","[66.261692, 218.590163, 92.386035, 66.135013, 102.860013]",0.0,False,[] +claude-sonnet-4-20250514,install-windows-3.11,5,"['3c351a24-993d-4606-b41b-428d27d3c4ae', '27aa0684-23e7-4576-bc2a-a6bde44cba1a', '9cae2e44-2d01-4ea0-9678-ab5f90087f6c', '2dd57c40-3797-4348-aecf-ac2c11aeac50', '603b3cb5-35c7-4d2f-84c7-ead220ce665d']","['install-windows-3.11__YRMZnxu', 
'install-windows-3.11__K9YRBvD', 'install-windows-3.11__xaJMXyE', 'install-windows-3.11__ZezyHW5', 'install-windows-3.11__gve6BUc']",0,"[446.727689, 1377.737715, 349.848141, 408.177102, 281.134732]","[30.852464, 40.787545, 13.804089, 28.551145, 63.495838]",0.0,False,[] +claude-sonnet-4-20250514,large-scale-text-editing,5,"['28314033-4e01-41a9-8e62-6e6cdc102943', 'ed7d62ec-44eb-4d38-a95d-8742047dab90', '0d7ff63f-b5ab-4cf2-8ec4-0848282919cf', '5b5bac83-1493-4690-b0c2-b0fa909b3f93', '628ea5a3-9861-4ac7-aae1-c13980af9ad1']","['large-scale-text-editing__tym6dwa', 'large-scale-text-editing__ftR4nrr', 'large-scale-text-editing__f77J5Yf', 'large-scale-text-editing__enfzRvL', 'large-scale-text-editing__VxxegWr']",3,"[524.042604, 1200.031628, 483.641946, 222.134031, 1243.338707]","[335.656589, 51.82602, 100.440362, 24.155805, 9.811633]",0.6,True,"['0d7ff63f-b5ab-4cf2-8ec4-0848282919cf', '5b5bac83-1493-4690-b0c2-b0fa909b3f93', '628ea5a3-9861-4ac7-aae1-c13980af9ad1']" +claude-sonnet-4-20250514,largest-eigenval,5,"['08e75dd0-5878-4a1d-89fe-b79780f11dc1', '01ee34f8-ada5-4462-8793-233fe6f4a60e', '958ed9ca-4650-43b3-8ba0-f86f0f4c20ec', '746adf2b-cdb4-4707-87c7-4414b106809f', 'cd7ef01a-96f3-4a9a-9d5a-3855aaf22a7b']","['largest-eigenval__WCp5P2F', 'largest-eigenval__iCnARjR', 'largest-eigenval__wxHKGAx', 'largest-eigenval__HkRoeJu', 'largest-eigenval__NzeDrhS']",0,"[902.578683, 903.644081, 906.091434, 846.486256, 949.621664]","[35.163894, 69.961199, 203.548271, 29.292864, 40.650751]",0.0,False,[] +claude-sonnet-4-20250514,log-summary-date-ranges,5,"['40276b94-d5bc-484e-9b87-78c8e2981b25', 'e19c5765-2c2d-4888-81bb-a1847ec6161a', '1b010f11-d81d-4372-a70a-c6da40acbc70', '6b194578-73b4-4f05-b022-f752e1852cac', 'a7af89f4-944b-477a-ac52-4c7df1305aee']","['log-summary-date-ranges__CZ6SRby', 'log-summary-date-ranges__UXrXrrD', 'log-summary-date-ranges__yS2nW3U', 'log-summary-date-ranges__Gz37RoG', 'log-summary-date-ranges__Ln4uwtc']",5,"[281.754222, 905.872455, 323.940119, 249.15373, 
251.878141]","[60.703191, 58.173504, 170.495682, 86.298582, 140.25373]",1.0,True,"['40276b94-d5bc-484e-9b87-78c8e2981b25', 'e19c5765-2c2d-4888-81bb-a1847ec6161a', '1b010f11-d81d-4372-a70a-c6da40acbc70', '6b194578-73b4-4f05-b022-f752e1852cac', 'a7af89f4-944b-477a-ac52-4c7df1305aee']" +claude-sonnet-4-20250514,make-doom-for-mips,5,"['d75bb81f-7dd7-4569-b344-14baa7831d09', '3f4892b4-06c7-4cef-8173-5e86a83870ca', 'b09d1d86-61a0-4f16-be74-d1683d6bc58d', 'e0cd8363-037c-4c37-9209-47a1ff78067d', '64986aa9-fbd0-4208-bbd0-bc088a3849ac']","['make-doom-for-mips__2wFw6hv', 'make-doom-for-mips__mwdoSqr', 'make-doom-for-mips__oMn85Nk', 'make-doom-for-mips__kt8MP7L', 'make-doom-for-mips__4UPWvyj']",0,"[901.964344, 1139.812455, 905.482606, 908.84883, 943.464124]","[214.830791, 39.973896, 49.706003, 50.893097, 88.619411]",0.0,False,[] +claude-sonnet-4-20250514,make-mips-interpreter,5,"['f13f733e-e7af-4fa3-97d3-fdba0af836ae', 'ae3138f0-2540-4371-b691-427e74741a24', 'e1adb003-860d-4701-bf14-c4b12bea0670', 'ab4c763a-bf90-41f6-a18b-a1ae0858d47e', 'bc697001-3346-435b-b3c6-8f11bd9ae00f']","['make-mips-interpreter__Hfz7EGW', 'make-mips-interpreter__oXDQ6Wv', 'make-mips-interpreter__WF6Q9CU', 'make-mips-interpreter__q8JaUpV', 'make-mips-interpreter__eCSmHYC']",0,"[1816.518797, 1804.113501, 1831.935171, 1802.642155, 1432.885008]","[75.274366, 128.350689, 18.766613, 160.842065, 23.040758]",0.0,False,[] +claude-sonnet-4-20250514,merge-diff-arc-agi-task,5,"['51b8307e-370c-41c4-93be-ff181fecbe67', '6026fc81-13ef-4c5b-a417-b19c79c72526', '8636c2e5-4372-491f-bbbb-4e44240a9a64', '2d6871f2-784a-436e-9972-739d90c258af', 'a6aa06dd-bb05-4352-a9f0-f0822d4f805c']","['merge-diff-arc-agi-task__DhcXAoJ', 'merge-diff-arc-agi-task__4SQ73jw', 'merge-diff-arc-agi-task__AifPBko', 'merge-diff-arc-agi-task__FPsQxkd', 'merge-diff-arc-agi-task__TsaFwLS']",0,"[901.14175, 408.617625, 811.21892, 798.267702, 901.797824]","[76.383579, 13.521116, 79.905225, 32.846349, 22.693918]",0.0,False,[] 
+claude-sonnet-4-20250514,model-extraction-relu-logits,5,"['2bc1a810-2c1f-40a9-9364-d2ee01dd1109', 'fab8b80d-b3df-45d6-a613-57241b5d125d', '0ff3f69b-56b5-454c-994e-edbbedef3979', 'c083db2f-7c25-457c-af72-a1a38065746f', 'c37c39e4-0c7a-46e9-819c-a37f9027b20a']","['model-extraction-relu-logits__dJBCg3h', 'model-extraction-relu-logits__8C2siwd', 'model-extraction-relu-logits__GsKi22a', 'model-extraction-relu-logits__tmChQVQ', 'model-extraction-relu-logits__tUKySnp']",0,"[524.281566, 706.415487, 368.724788, 718.960034, 1420.753144]","[121.405815, 33.094586, 104.199469, 15.701638, 14.963202]",0.0,False,[] +claude-sonnet-4-20250514,mteb-leaderboard,5,"['8db9717c-a718-467c-93bb-521575401644', '4b11afde-c593-4d2c-83df-d12f1b8008c1', '3a989814-8093-43c9-a91e-e6e657d3987e', '0dd6db81-a42f-4608-892d-64d3c445067f', '6687c461-5cb3-4b45-aac0-7902384f48d3']","['mteb-leaderboard__YgJDpxz', 'mteb-leaderboard__DQSQmuS', 'mteb-leaderboard__iywaoq8', 'mteb-leaderboard__BKTbuFB', 'mteb-leaderboard__axAnq9g']",0,"[58.604664, 681.757995, 20.98843, 60.790112, 160.061072]","[115.049323, 29.555478, 12.590633, 8.441113, 5.367837]",0.0,False,[] +claude-sonnet-4-20250514,mteb-retrieve,5,"['d5df5d43-7d4d-436b-9bcd-4929ce745323', '7db68ba8-e14d-4f08-9bbb-5faa755228af', 'a3b290be-abad-4ce2-b8b9-c3e5d3239159', '1a528372-4f54-40e6-92f3-b4f8f5db7fa7', 'cc328a2b-99c8-495c-9e9d-7b068f72e158']","['mteb-retrieve__uG5pVam', 'mteb-retrieve__YejRwdo', 'mteb-retrieve__d7uTLbS', 'mteb-retrieve__wiNT8Ns', 'mteb-retrieve__qcSuPAB']",0,"[468.498031, 281.241099, 183.194009, 326.787733, 232.474923]","[4.485186, 3.688195, 64.362172, 17.376076, 3.913398]",0.0,False,[] +claude-sonnet-4-20250514,nginx-request-logging,5,"['b7256ad5-b158-4c4c-a710-7128603f531e', '9ee16c08-cecb-46e2-9eaa-8eb39b2db039', '25a59681-30bd-494c-8d91-a7320a56800c', '7f64cd27-88f1-428a-b0f3-c6384f56e87b', 'f686c6dc-4ad8-4fbe-b859-e54c8940f247']","['nginx-request-logging__T9Pk9BK', 'nginx-request-logging__qqnGfy2', 
'nginx-request-logging__QFLjUEC', 'nginx-request-logging__5EJy6ro', 'nginx-request-logging__xFykce7']",5,"[254.527126, 448.836396, 237.665196, 491.848489, 671.271016]","[48.010051, 104.56853, 13.198089, 77.294033, 60.947679]",1.0,True,"['b7256ad5-b158-4c4c-a710-7128603f531e', '9ee16c08-cecb-46e2-9eaa-8eb39b2db039', '25a59681-30bd-494c-8d91-a7320a56800c', '7f64cd27-88f1-428a-b0f3-c6384f56e87b', 'f686c6dc-4ad8-4fbe-b859-e54c8940f247']" +claude-sonnet-4-20250514,openssl-selfsigned-cert,5,"['764ea5e2-dd54-45fd-8bc7-5525451330d9', '09810eb0-c4a3-4d74-a503-3ff019dc2d56', '9cb8a272-20ef-4fd3-bb45-473903962437', '76db8ef1-d55b-4b76-82c2-7eeaa0ee9d73', 'bc506962-76de-4eed-9f96-d8646f41928c']","['openssl-selfsigned-cert__bv6aJwu', 'openssl-selfsigned-cert__Nz2PWzy', 'openssl-selfsigned-cert__H2zxqmr', 'openssl-selfsigned-cert__YP4DzVC', 'openssl-selfsigned-cert__45x9CUe']",4,"[292.147122, 166.601485, 249.032878, 1268.274704, 418.451482]","[81.068907, 117.568624, 24.851086, 163.38067, 47.511297]",0.8,True,"['764ea5e2-dd54-45fd-8bc7-5525451330d9', '09810eb0-c4a3-4d74-a503-3ff019dc2d56', '9cb8a272-20ef-4fd3-bb45-473903962437', 'bc506962-76de-4eed-9f96-d8646f41928c']" +claude-sonnet-4-20250514,password-recovery,5,"['889967a4-8c41-482a-8daf-f679f80b049c', '7581e486-f025-4d2a-a95f-4628a3e0c9f2', '9e3c93af-92f8-4104-ae4d-cb74402303e3', '84aa6535-9a4f-4791-aae2-b69f5a20c1fb', 'c18480b4-b3d9-413b-ba83-535f8945e605']","['password-recovery__5Xki8Gk', 'password-recovery__hYdRZCQ', 'password-recovery__w3uh68p', 'password-recovery__JuFKpmb', 'password-recovery__XFokVu5']",2,"[864.163425, 900.000618, 475.896713, 574.155521, 900.889209]","[79.821351, 43.038122, 44.486019, 16.463903, 29.224977]",0.4,False,"['889967a4-8c41-482a-8daf-f679f80b049c', '7581e486-f025-4d2a-a95f-4628a3e0c9f2']" +claude-sonnet-4-20250514,path-tracing,5,"['33e66ecc-3e50-460d-ab42-eba27e76550e', '00b0e268-080e-4a30-bb5f-921019fa3797', '06011a48-5bb2-4572-a348-5d57a1cca624', '15b7bc11-8cfd-49b9-84ac-7e79cdda30cc', 
'5f747fbc-102a-4372-84f4-b69ca27ebd17']","['path-tracing__jHWYvY6', 'path-tracing__hh9TMSZ', 'path-tracing__dNNzCwj', 'path-tracing__DJqNzg4', 'path-tracing__n8ThDUi']",0,"[501.448726, 532.645955, 1806.632549, 579.820103, 688.470896]","[146.160731, 16.09964, 14.928689, 36.086071, 86.926262]",0.0,False,[] +claude-sonnet-4-20250514,path-tracing-reverse,5,"['33c3b258-b34a-4df9-925c-971684edf076', '1a053e8f-4280-470f-a8e8-ffb2a6e869f8', '54313854-adce-47de-9c1c-9993e95a3b4f', '2b308509-85fb-4fd3-a85b-bd75b18e481d', '8eee870a-d4ed-491b-9bd4-abc0a8b79e60']","['path-tracing-reverse__3fddLDx', 'path-tracing-reverse__4HPyeXw', 'path-tracing-reverse__Tt6Gbgj', 'path-tracing-reverse__fnad2t7', 'path-tracing-reverse__cwRsokX']",0,"[1093.46063, 1630.085549, 1486.747992, 965.08116, 1265.003482]","[128.124693, 92.977812, 37.991382, 40.826526, 149.872778]",0.0,False,[] +claude-sonnet-4-20250514,polyglot-c-py,5,"['e929db16-6bfa-4b68-9b0e-1d59c45bfb71', '948b46f9-4622-4d42-aaf8-8181f0dc4eb6', '3b0fcfda-e096-4c3a-81ca-ab7b74de3f11', '23a1fe6f-4b26-4a39-b888-49cb5b80b99c', '1f48f955-08c6-46a1-b7ed-a7f2be8d50c1']","['polyglot-c-py__x3rZ4jw', 'polyglot-c-py__fQv7EE8', 'polyglot-c-py__RMmNFTB', 'polyglot-c-py__PGqZyfK', 'polyglot-c-py__hkoJJnT']",0,"[120.665617, 284.25121, 243.673757, 209.998694, 902.81744]","[20.933305, 35.841364, 25.460013, 17.673068, 41.188966]",0.0,False,[] +claude-sonnet-4-20250514,polyglot-rust-c,5,"['47386a09-06c2-42dc-82c7-3403a9b34349', '67f0de7a-25df-4e4b-8694-32235ee1275a', '183a1834-b322-401c-a75d-c458788d00a9', '43462abe-2444-41c2-a0a7-b4db7b35b726', '728d538f-d5fd-4007-9d6a-9e6db7198a32']","['polyglot-rust-c__iVRjjTn', 'polyglot-rust-c__uXTiKao', 'polyglot-rust-c__AmcgYu9', 'polyglot-rust-c__kbYaime', 'polyglot-rust-c__aJEChDH']",0,"[901.27832, 900.224497, 900.535424, 902.534725, 909.145594]","[28.741958, 14.301151, 271.251369, 128.280841, 45.921333]",0.0,False,[] +claude-sonnet-4-20250514,port-compressor,5,"['27f8e549-810e-4c14-ad4b-72fa01b28fc1', 
'5bf64581-bc7d-4cf2-bf1e-7bf347d7791e', '0f43cb55-2c61-45db-9b04-ad48d68f5781', '8b53bdd3-248a-4f20-8fd1-511eedd6f448', 'da48ae58-d3f0-4173-bf81-193cde60cf3c']","['port-compressor__HnXqiBs', 'port-compressor__raJ6Vk4', 'port-compressor__gM8KDXz', 'port-compressor__aCNqis3', 'port-compressor__hFiKjLz']",1,"[2872.485564, 3609.163831, 3617.737665, 3600.021671, 3600.007842]","[55.870813, 68.306909, 53.885792, 146.904429, 34.085694]",0.2,False,['27f8e549-810e-4c14-ad4b-72fa01b28fc1'] +claude-sonnet-4-20250514,prove-plus-comm,5,"['b5befc8d-dabc-4f55-a9aa-b6a13d364079', '6083b672-b030-41d8-bdf8-98b6801c2ab7', '7a470ea9-c6a1-44c0-b8bf-1182dfa7291f', '2046ff37-8d79-4b3a-b92d-f6d75afe18e6', '6f5eaaad-ff22-4b2b-9a0a-e77d647a8b29']","['prove-plus-comm__FKBHgsZ', 'prove-plus-comm__HKAoX7c', 'prove-plus-comm__ipsk4Tk', 'prove-plus-comm__aKFeY7W', 'prove-plus-comm__zNNxL3K']",5,"[448.93355, 489.077852, 279.200321, 198.77971, 124.80742]","[30.392774, 61.996815, 141.622238, 24.565705, 39.944673]",1.0,True,"['b5befc8d-dabc-4f55-a9aa-b6a13d364079', '6083b672-b030-41d8-bdf8-98b6801c2ab7', '7a470ea9-c6a1-44c0-b8bf-1182dfa7291f', '2046ff37-8d79-4b3a-b92d-f6d75afe18e6', '6f5eaaad-ff22-4b2b-9a0a-e77d647a8b29']" +claude-sonnet-4-20250514,pypi-server,5,"['0af2ceb3-da0d-4bf3-b889-dc7456542ec5', '90647da0-6851-4edf-8949-2218f4331045', '26729bb1-d9ff-4d90-bd8d-56932cb0d7b4', '283be447-df8c-433e-b586-e5c41031ab99', '81696cee-aec4-41fb-a3da-1a2d256a8171']","['pypi-server__tVZRozG', 'pypi-server__5oNZSwe', 'pypi-server__wUg22Vi', 'pypi-server__sQPDLev', 'pypi-server__5zxCK2Y']",4,"[408.477541, 570.69396, 518.259086, 1013.456787, 615.918587]","[44.570346, 85.302009, 202.858907, 200.39081, 101.370516]",0.8,True,"['0af2ceb3-da0d-4bf3-b889-dc7456542ec5', '90647da0-6851-4edf-8949-2218f4331045', '26729bb1-d9ff-4d90-bd8d-56932cb0d7b4', '81696cee-aec4-41fb-a3da-1a2d256a8171']" +claude-sonnet-4-20250514,pytorch-model-cli,5,"['5a31e89e-d186-4eb6-9291-b334cd3a80a5', 'b3255bde-5951-4e8d-bdb9-6f49db75e659', 
'ace70c6f-52bd-451f-9fb9-c227108a7333', '1a85ecba-8e29-4b23-bc07-7cfae5a16c87', '5d1d38c7-c9f5-4b51-963c-ca8ca52dd2ec']","['pytorch-model-cli__YAZCVgm', 'pytorch-model-cli__s5HWt66', 'pytorch-model-cli__VyeGZzY', 'pytorch-model-cli__oihj7xJ', 'pytorch-model-cli__DpZyStK']",2,"[546.13274, 519.731355, 787.452802, 805.782644, 900.001649]","[27.82807, 82.6177, 99.977389, 32.408722, 67.400065]",0.4,False,"['ace70c6f-52bd-451f-9fb9-c227108a7333', '1a85ecba-8e29-4b23-bc07-7cfae5a16c87']" +claude-sonnet-4-20250514,pytorch-model-recovery,5,"['79d8264a-f5c3-443f-87e4-d7ecee3c561d', '042787c0-52d6-4d41-9140-bb0dac2b803e', '8c7af778-3908-402a-baa1-d28cff72d4ae', 'd8e453c2-2891-4f35-a246-a52b6e246ca1', '46075612-92dd-4445-b27b-76dd2711cbdc']","['pytorch-model-recovery__vhxy9oL', 'pytorch-model-recovery__oxggJ8t', 'pytorch-model-recovery__T3o5Hik', 'pytorch-model-recovery__eK9jdRk', 'pytorch-model-recovery__hP7HSCx']",5,"[443.183093, 574.999406, 547.444523, 281.056262, 901.875033]","[56.630584, 65.752779, 43.44883, 34.335257, 102.119859]",1.0,True,"['79d8264a-f5c3-443f-87e4-d7ecee3c561d', '042787c0-52d6-4d41-9140-bb0dac2b803e', '8c7af778-3908-402a-baa1-d28cff72d4ae', 'd8e453c2-2891-4f35-a246-a52b6e246ca1', '46075612-92dd-4445-b27b-76dd2711cbdc']" +claude-sonnet-4-20250514,qemu-alpine-ssh,5,"['da970dac-9368-40b3-bbaa-e2dc89d5f103', '6a72c6a3-67b4-4a41-b12b-64d2d42f9ec0', 'e5ded101-a798-460f-94f9-cb01ac5cc0f3', 'cc8c841a-774e-4ea9-b732-fafa8c12cb81', '35e727c3-cd38-465a-b6c0-0284251a3495']","['qemu-alpine-ssh__KmC42pT', 'qemu-alpine-ssh__8okJZan', 'qemu-alpine-ssh__7M7FpNE', 'qemu-alpine-ssh__gJGQVwu', 'qemu-alpine-ssh__b3k66y9']",3,"[646.304485, 600.721124, 551.596622, 1009.371395, 308.400338]","[9.368256, 15.875048, 76.185239, 6.25245, 28.363307]",0.6,True,"['da970dac-9368-40b3-bbaa-e2dc89d5f103', '6a72c6a3-67b4-4a41-b12b-64d2d42f9ec0', '35e727c3-cd38-465a-b6c0-0284251a3495']" +claude-sonnet-4-20250514,qemu-startup,5,"['40105664-d7d9-4161-aa81-fbe8ecc3d460', 
'8eff9bc9-5442-46ca-a223-40ecf47af59a', 'ddee4f23-9621-449a-ae45-e4b4b8d12da6', 'b3329310-2870-4d7c-993f-e1aafe12dd8e', 'f7ad557c-12ed-4ce0-8b33-694dbb81190d']","['qemu-startup__xbVWGYc', 'qemu-startup__HxGmChM', 'qemu-startup__RnSj5Q2', 'qemu-startup__XkRWwbU', 'qemu-startup__sqCKjpL']",2,"[915.963414, 905.482006, 903.382758, 909.511829, 768.555707]","[41.462526, 3.641036, 15.650509, 13.45561, 9.517684]",0.4,False,"['40105664-d7d9-4161-aa81-fbe8ecc3d460', 'f7ad557c-12ed-4ce0-8b33-694dbb81190d']" +claude-sonnet-4-20250514,regex-log,5,"['40a54beb-c1e6-4b7d-9905-9a70233b278c', '2fbed525-2d74-40bb-8b93-e42bfebbb3ec', '6bf2a2bd-d3d6-4179-9a29-3e7afb95dad9', '8dd05b49-b4e4-4652-87dd-207dc51d5387', 'aa1d1daa-08fb-4f85-929d-ce91ed1ef9ab']","['regex-log__3Hr8pVp', 'regex-log__nthgCL5', 'regex-log__bhJ6gaS', 'regex-log__rCRDkpr', 'regex-log__hzKPtQq']",4,"[394.074606, 238.051022, 252.274683, 128.273127, 486.005807]","[34.032436, 225.003763, 164.391925, 151.194799, 42.75356]",0.8,True,"['40a54beb-c1e6-4b7d-9905-9a70233b278c', '2fbed525-2d74-40bb-8b93-e42bfebbb3ec', '6bf2a2bd-d3d6-4179-9a29-3e7afb95dad9', 'aa1d1daa-08fb-4f85-929d-ce91ed1ef9ab']" +claude-sonnet-4-20250514,reshard-c4-data,5,"['8b44e4fd-0af6-4b87-9907-6af662d9231b', '40488afa-6691-4eb4-927f-fbfbf1cc9b9d', 'a5c7c2f4-f26e-426f-aa1e-117ca5e40f48', '2a7c987c-604b-4e93-a45d-9e44554555bd', '70b4e21e-58cc-4ec5-bf06-754283ad6206']","['reshard-c4-data__KLwGt8Z', 'reshard-c4-data__2iwUSaX', 'reshard-c4-data__4ujCmaq', 'reshard-c4-data__xbYeJT5', 'reshard-c4-data__9wKdbLU']",0,"[900.587631, 900.401121, 1835.648696, 451.346809, 495.955441]","[252.692532, 57.224747, 94.00394, 101.674785, 112.685748]",0.0,False,[] +claude-sonnet-4-20250514,reverse-engineering,5,"['5fca7c12-2229-4b02-9d4d-2cefcd9d93dc', '7fc0b3c6-c172-4ad1-82c0-8cc16c9f0746', 'b88074c6-bcff-41b7-b324-bfec10242d44', 'a46ecde0-6724-486e-8e17-9f9289e2bb08', '13dfea1f-a6f0-4b8e-b051-7f844898b6df']","['reverse-engineering__b93e84T', 'reverse-engineering__PBUfq25', 
'reverse-engineering__Re6nhbK', 'reverse-engineering__GqVPpqE', 'reverse-engineering__LQYaKPb']",0,"[1805.487131, 1800.534735, 1809.554577, 1800.460828, 1800.001568]","[28.27818, 11.708686, 45.482932, 28.439922, 82.005317]",0.0,False,[] +claude-sonnet-4-20250514,run-pdp11-code,5,"['5d8e8b0d-b08b-4f19-8aba-c4c3f4c5218c', 'd3847054-5ee8-45d9-8739-d9c18f287e2e', 'b6726919-cf21-47fd-9940-e26eb93b98b2', 'c9e5da16-613d-4f92-80f1-38029855cf5b', '1a487bbd-b3f1-4fd6-9ce6-0f4ec59624ac']","['run-pdp11-code__VmMYnUd', 'run-pdp11-code__g2MzJSf', 'run-pdp11-code__mNXXQLv', 'run-pdp11-code__z5qPkoY', 'run-pdp11-code__TMs6tCG']",0,"[1001.265534, 559.257241, 1067.624187, 625.90093, 1039.243392]","[281.5589, 20.394519, 37.058626, 41.316058, 62.767889]",0.0,False,[] +claude-sonnet-4-20250514,sanitize-git-repo,5,"['7c46e0ff-7e20-4818-99a6-696ba088760a', '45ef3e22-0c00-4e15-8cb7-174143623546', 'aa4326ef-b6a7-4884-ab0d-f40bfaddb2d7', '55db6067-435f-43fd-a308-50ba39bb8106', '019fbdb9-f7d3-4475-a1a5-aaecae0e1a6f']","['sanitize-git-repo__A6Zr28M', 'sanitize-git-repo__cJF6PSU', 'sanitize-git-repo__9GHfmSr', 'sanitize-git-repo__hLJvpmF', 'sanitize-git-repo__gPGnxz3']",0,"[769.707821, 906.840565, 784.537945, 901.269109, 917.23959]","[19.74139, 79.6273, 25.971838, 14.18499, 20.742255]",0.0,False,[] +claude-sonnet-4-20250514,schemelike-metacircular-eval,5,"['12db81e6-9e97-4a1e-94b4-c2a458b48a84', 'f50b997e-5703-4006-8c6d-0aa3590f3f6c', '855d8bb1-5772-445b-925e-19be7213974e', '339da028-8c2d-443d-b471-07c917afb1b4', '1002e53c-73d9-4692-b6d2-0347eeccea75']","['schemelike-metacircular-eval__dG8TL6S', 'schemelike-metacircular-eval__QTjJXcD', 'schemelike-metacircular-eval__LAYXDZg', 'schemelike-metacircular-eval__fWkjp72', 'schemelike-metacircular-eval__x2tX8vn']",0,"[2400.626329, 2400.026386, 2402.966717, 557.23096, 2452.707799]","[119.895409, 209.426635, 43.526091, 40.194037, 40.717032]",0.0,False,[] +claude-sonnet-4-20250514,sparql-university,5,"['08ef2ddf-b5c6-4163-9e27-841c4c06876e', 
'8cc8d520-557a-4e13-89c2-fd21ada68f2b', '49ec91e7-60fb-4f0d-b6e1-68567f5f90ab', 'eb745a21-d8b6-41f7-a97f-dccb3248c928', '2c8bf95a-102c-4572-8010-c3898129d7c6']","['sparql-university__bgE6FaK', 'sparql-university__s72A9t2', 'sparql-university__mysB5Nq', 'sparql-university__ptemYtx', 'sparql-university__pQZNRqj']",0,"[1013.533783, 663.421862, 595.466802, 382.729176, 884.868928]","[277.003866, 46.881356, 119.904889, 89.041725, 90.200265]",0.0,False,[] +claude-sonnet-4-20250514,sqlite-db-truncate,5,"['d1c575cd-dc0e-4807-9d7c-0d5ffc7dc04a', '5fe43ab3-79df-4a1f-bce3-f78b5225b82d', '4363c7e4-bd6d-45a0-8ebe-0dd794754420', '5c2bd8d4-a671-4439-88ea-2938c391e038', '3cde7713-8499-4c45-aa48-2929cd9c6b49']","['sqlite-db-truncate__Q3fY9WR', 'sqlite-db-truncate__QNcDWCp', 'sqlite-db-truncate__k6qp7zh', 'sqlite-db-truncate__QyvnHF4', 'sqlite-db-truncate__tydxwrF']",0,"[203.612365, 795.044249, 426.912206, 396.272263, 279.11761]","[34.160087, 44.748655, 59.438358, 62.304726, 89.987261]",0.0,False,[] +claude-sonnet-4-20250514,sqlite-with-gcov,5,"['524f65d5-7371-4411-af61-8677b044a050', 'f943eb17-38ec-45d7-9156-57dc16ed976d', '1eba1354-4db4-4665-81f8-fcc0fdb58cb1', 'f91c8df8-8dcc-4560-8428-117a80792864', '78c8ff98-65e7-49bb-be76-7527e43dedf7']","['sqlite-with-gcov__kzLnX96', 'sqlite-with-gcov__zBLENTt', 'sqlite-with-gcov__226WBZJ', 'sqlite-with-gcov__cDxv4Nx', 'sqlite-with-gcov__kL4VHsq']",1,"[773.164517, 1001.348478, 486.47177, 595.000597, 362.022982]","[27.963541, 60.615874, 54.30838, 45.666564, 75.739346]",0.2,False,['78c8ff98-65e7-49bb-be76-7527e43dedf7'] +claude-sonnet-4-20250514,torch-tensor-parallelism,5,"['31903b1d-b565-410f-84b7-9818a9277888', '0fc04776-bb22-4e43-8c1c-8d0394ef5b4e', 'c40641fe-8ddf-48f0-94fe-59c0465eecbd', '62fdd083-226e-4183-bbd8-88a6f12277e6', '9255d4c7-9963-4b2b-a0c7-252619f1afcf']","['torch-tensor-parallelism__wJwc3zS', 'torch-tensor-parallelism__qLKgwq5', 'torch-tensor-parallelism__TTH6T42', 'torch-tensor-parallelism__gXE2ZuG', 
'torch-tensor-parallelism__E5YeHAE']",0,"[155.309924, 94.305263, 173.524139, 185.69269, 344.673573]","[40.995995, 40.918336, 42.312442, 47.6956, 123.090006]",0.0,False,[] +claude-sonnet-4-20250514,train-fasttext,5,"['f4e2e17b-4463-468e-9b50-5b197465dd0b', 'f929d823-dee6-409e-9db1-d405031e0364', 'd55842c3-4000-4d30-9d39-1ed8c8ae39b2', 'e19791a2-18bb-48be-b6c1-a571f73ed317', 'a875fca5-bec3-4a26-8344-a936d8ffc665']","['train-fasttext__onn4Fdx', 'train-fasttext__WZc3Fw7', 'train-fasttext__hgoS5AB', 'train-fasttext__huGuF34', 'train-fasttext__wqypc6r']",0,"[3606.13041, 1564.457289, 3647.624007, 3632.178211, 3600.344847]","[28.322687, 14.864133, 23.817425, 55.616627, 60.596791]",0.0,False,[] +claude-sonnet-4-20250514,tune-mjcf,5,"['f4a635bb-c4ef-4bef-a2a9-5bf0a4b993e3', '9b2bc8be-0cdf-408f-a68d-f2ce61857c7d', '09d503f6-3201-4e56-afbf-c7fab57aafdf', 'ae90ff68-d2ef-4557-a55e-6e07c1df3428', '9002e43e-163d-4f5b-aaf8-b199d55abd51']","['tune-mjcf__vRUfTtf', 'tune-mjcf__BUJfTah', 'tune-mjcf__wxZH78S', 'tune-mjcf__9xuf27v', 'tune-mjcf__oRw4mjU']",1,"[900.090081, 903.328349, 903.023557, 335.184879, 949.742623]","[9.529688, 25.192572, 34.860945, 15.53575, 28.76333]",0.2,False,['ae90ff68-d2ef-4557-a55e-6e07c1df3428'] +claude-sonnet-4-20250514,video-processing,5,"['fefd6259-132e-4ed0-b7a3-18a1dd449598', '72441315-2887-46c0-9164-780e68361e70', 'beb42e90-b6e2-4448-b750-dec215da40a8', '72afd092-4dc5-49fa-b4df-e19476df99db', '98c85ef1-1886-4d04-93a9-36d48e7fa859']","['video-processing__v22AqD4', 'video-processing__7pFBYxY', 'video-processing__jB9CaZu', 'video-processing__DMwMqBc', 'video-processing__tpg7BkT']",0,"[242.910185, 238.995213, 595.645043, 505.344073, 284.249982]","[43.008945, 38.935217, 36.53366, 37.54378, 159.674364]",0.0,False,[] +claude-sonnet-4-20250514,vulnerable-secret,5,"['776ea66e-ef0f-4154-9bb4-d3894c794198', 'fa2edbb9-a728-4af7-b0c9-10093ded35b1', 'b806eeac-65bb-4d9f-af81-32a9487409c7', '5685eabb-5488-422b-b191-19ddcfeeba45', 
'bdc8892c-bbea-4564-a78a-4b678bf45e80']","['vulnerable-secret__mp4Tpbz', 'vulnerable-secret__9S6xYST', 'vulnerable-secret__MorUZVU', 'vulnerable-secret__oHYYq6a', 'vulnerable-secret__2oxrNEz']",0,"[900.147484, 906.159663, 900.136937, 906.757759, 936.769757]","[10.277741, 64.755995, 14.606473, 68.874403, 65.989834]",0.0,False,[] +claude-sonnet-4-20250514,wasm-pipeline,5,"['863f0fa2-4254-4da1-b6b5-cf6685825362', 'c938f063-6418-4386-88ff-f6cd39264402', 'e3191908-bc63-4d5d-8db9-1995d863ef37', '0a63537f-7450-4da3-84b4-89cf6044ca72', '16f43645-c8a5-467c-b37b-1f43313e9ec4']","['wasm-pipeline__hFfPajz', 'wasm-pipeline__ANzjHfo', 'wasm-pipeline__okGYqFH', 'wasm-pipeline__V3HpQjR', 'wasm-pipeline__HuVDMYt']",3,"[798.060662, 408.234483, 474.62786, 835.237167, 527.599633]","[21.53203, 5.27028, 10.860162, 4.55111, 34.383665]",0.6,True,"['c938f063-6418-4386-88ff-f6cd39264402', '0a63537f-7450-4da3-84b4-89cf6044ca72', '16f43645-c8a5-467c-b37b-1f43313e9ec4']" +claude-sonnet-4-20250514,winning-avg-corewars,5,"['e3a685c1-c023-4dca-a60b-83cd5c93342c', '33dc4748-587a-4c9a-b29c-3d15b7a6fb1f', '11e10e32-c808-4617-a5c6-a35438ee25ec', '0ab2a2c3-3e70-4e61-b6bc-6a371f18180c', '3b6ae06e-0b7c-47fa-81d2-7b082207e94b']","['winning-avg-corewars__3jBKgER', 'winning-avg-corewars__qiUT9ra', 'winning-avg-corewars__gLtSkMA', 'winning-avg-corewars__FS8y4j5', 'winning-avg-corewars__VaiP2Yv']",0,"[1086.853986, 1984.640415, 1921.203205, 1962.447596, 3817.485632]","[51.533113, 59.668235, 64.502706, 4.583127, 5.034198]",0.0,False,[] +claude-sonnet-4-20250514,write-compressor,5,"['b1c4728f-641a-406d-a1b6-1f5dabc607c8', '939960f1-6c39-4330-9dd4-9a1918291666', 'eea220be-b6c8-4983-a6ec-d57cde4fbb09', 'e12a173d-734f-46f5-8240-9491a4017210', '209be4c8-0bd3-4dba-a270-f2f26f4b9d4a']","['write-compressor__XzKwpuX', 'write-compressor__n6bXKU5', 'write-compressor__ztFu63G', 'write-compressor__Udce7Nu', 'write-compressor__QpHuJqq']",0,"[904.585595, 900.03297, 900.001485, 900.945399, 1416.858009]","[32.701985, 
67.788881, 53.919296, 51.544861, 18.969036]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,adaptive-rejection-sampler,5,"['cd7e45fd-cb30-4f4c-a2fd-819027102a24', '81a5c951-9163-418e-b7d2-b1735d14a57a', 'd99ac1e3-8197-4b2e-9f6e-6e1054dc5490', '2a273648-a6f4-41dc-bc0c-52077b1c0f78', 'b52367d7-d6ae-4ac9-befa-b578ea630571']","['adaptive-rejection-sampler__LAuK7Ya', 'adaptive-rejection-sampler__DFj9rrK', 'adaptive-rejection-sampler__etgsTvX', 'adaptive-rejection-sampler__CtwiMYD', 'adaptive-rejection-sampler__JKsQevX']",1,"[921.045348, 901.072124, 909.159333, 900.006481, 904.762378]","[230.647192, 86.351948, 47.520102, 23.039177, 132.336483]",0.2,False,['2a273648-a6f4-41dc-bc0c-52077b1c0f78'] +deepseek-ai/DeepSeek-V3.1,bn-fit-modify,5,"['3bf026a8-8878-4aac-8a89-18ece7b0e54f', '69910ede-e92f-479c-8f2a-7d02ef9d1f6c', '9926281f-2c4f-4588-8fa3-aa49548459f4', '9aec2289-409b-498e-b4cb-591fe49ad2ba', '3eae4e47-31ee-4938-88ec-495b1e16a3ee']","['bn-fit-modify__c7wtMEn', 'bn-fit-modify__jmzXYB4', 'bn-fit-modify__J4NnLti', 'bn-fit-modify__GC5mD47', 'bn-fit-modify__5hTJS6k']",0,"[1015.560609, 805.205108, 764.198961, 3003.956623, 257.77484]","[44.088396, 28.250321, 165.02589, 25.474881, 102.138555]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,break-filter-js-from-html,5,"['9946fe4b-1f16-4b2a-869c-67978b1ce6e7', '36b8b409-f1f9-4459-af0a-3eaa448c3a8b', '4d5a7857-dda2-44ef-933b-ebee4ddb8e43', 'eb80e1a1-98a1-4476-9428-199df528a4ee', '7f5a9e0f-6988-4683-bb2f-331b783fa8b9']","['break-filter-js-from-html__iYGyoZ6', 'break-filter-js-from-html__jSa68h5', 'break-filter-js-from-html__sE6uLcH', 'break-filter-js-from-html__sVQqUGx', 'break-filter-js-from-html__9uAVqst']",0,"[1222.818287, 423.41117, 168.862087, 1252.880764, 386.618178]","[15.891394, 39.504776, 30.49194, 99.538045, 83.415246]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,build-cython-ext,5,"['59473358-544b-4863-9c1a-1abb1bfebab5', '881f9246-490c-428a-92f6-8099e0aab85c', '6bc07c9a-12d2-4db9-95c7-869a58990822', 
'c936df74-0c2a-4003-a8e9-7678b8b1b0ca', 'cc48fed2-91d7-4c3f-8eda-ed44ed0966c5']","['build-cython-ext__mMT94xf', 'build-cython-ext__JyuXsrf', 'build-cython-ext__TEJmLAf', 'build-cython-ext__fDT5kon', 'build-cython-ext__btSwFCh']",0,"[906.657237, 900.421584, 590.375358, 795.004501, 476.681314]","[35.288534, 109.611359, 66.337733, 135.136694, 19.496544]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,build-initramfs-qemu,5,"['e9898836-4c94-4f10-a6d6-6153b9926f9e', '2da9257d-d798-45cc-934b-cec9f4474f82', 'e2d13ced-cf43-4c98-b974-110ab55f648e', '6ace35a6-8943-44fe-ab50-12a804888879', '311a2ea0-2081-4549-a236-3c90f0924f6a']","['build-initramfs-qemu__HAyJjew', 'build-initramfs-qemu__BDghdvw', 'build-initramfs-qemu__QjcN8FN', 'build-initramfs-qemu__apUCqQE', 'build-initramfs-qemu__ceyzcV5']",0,"[906.348501, 902.509799, 900.191695, 900.263867, 903.062251]","[54.798184, 39.907266, 48.877912, 25.005287, 37.682834]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,build-pmars,5,"['4fbefe11-44f5-42ce-b8ca-7b64d20697f1', '0a5b4755-e74a-4188-aa96-99d5d7e47808', 'c433bb70-3d29-4517-92c6-3e8ba4f64b8b', '1458a7c2-1249-4032-a516-3e4598c1a0e3', 'c020c02b-6cf4-4bd0-a81b-2bcd96c01deb']","['build-pmars__SBbuzKD', 'build-pmars__gaaHHmj', 'build-pmars__9AWvMXE', 'build-pmars__F5E59Tq', 'build-pmars__PjRXkLb']",5,"[364.590255, 252.559786, 345.27496, 236.012856, 424.46778]","[55.158682, 9.744596, 28.915165, 3.304711, 10.901515]",1.0,True,"['4fbefe11-44f5-42ce-b8ca-7b64d20697f1', '0a5b4755-e74a-4188-aa96-99d5d7e47808', 'c433bb70-3d29-4517-92c6-3e8ba4f64b8b', '1458a7c2-1249-4032-a516-3e4598c1a0e3', 'c020c02b-6cf4-4bd0-a81b-2bcd96c01deb']" +deepseek-ai/DeepSeek-V3.1,build-pov-ray,5,"['860bd125-e82a-455d-a4f2-66778adfde77', '14d3f843-9db3-4ee6-a8e6-68a12e6153fa', '193e57c9-2515-419b-ba43-c099fa13b2be', 'd9614988-4b95-4409-a8e0-9345e439c5a3', '66bfefa1-69b8-4e3f-9ee1-a37207314321']","['build-pov-ray__aGQrMHc', 'build-pov-ray__6xenUtP', 'build-pov-ray__xoY98qN', 'build-pov-ray__GbzRGra', 
'build-pov-ray__QhuU5H8']",2,"[2107.552499, 1001.618871, 2338.508084, 6213.433423, 483.486725]","[22.43157, 91.206657, 61.154776, 50.44504, 16.126741]",0.4,False,"['193e57c9-2515-419b-ba43-c099fa13b2be', '66bfefa1-69b8-4e3f-9ee1-a37207314321']" +deepseek-ai/DeepSeek-V3.1,cancel-async-tasks,5,"['591ef413-f093-4569-89b0-8f032a8d11fe', '01e207d2-b71d-43ed-81a8-b8e2c2e71036', '37509f38-6adc-4ef1-8386-42d58077ea1d', 'ecf2f8d3-2b98-4f2a-b906-c4307443caa8', '176090f4-0f48-4fba-9631-f9a39566165d']","['cancel-async-tasks__wK6byW6', 'cancel-async-tasks__aTorLAy', 'cancel-async-tasks__EJt2mVR', 'cancel-async-tasks__miG9bwM', 'cancel-async-tasks__D5LsRRj']",2,"[162.553326, 726.759106, 202.099645, 28.96675, 77.188323]","[53.376497, 159.575092, 47.358792, 71.305565, 55.027607]",0.4,False,"['591ef413-f093-4569-89b0-8f032a8d11fe', '37509f38-6adc-4ef1-8386-42d58077ea1d']" +deepseek-ai/DeepSeek-V3.1,chess-best-move,5,"['b9080d52-635b-47fd-8ad4-2f2847029136', 'b008c349-bf1d-4b2d-8471-93a5ffc60331', 'b66f9625-a8c4-487d-b5f0-9db98fe2da4e', '4b4cd1fd-32aa-443d-9e6c-743274ed6410', 'c35e2e8f-9cfc-43f0-8015-5da494476702']","['chess-best-move__auMcGYR', 'chess-best-move__oMizB6b', 'chess-best-move__7fzCXKg', 'chess-best-move__oxNbqAD', 'chess-best-move__rTqLSkf']",0,"[422.05488, 196.529202, 410.467958, 565.509823, 888.240521]","[100.134359, 26.416025, 7.871477, 13.849878, 53.753498]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,circuit-fibsqrt,5,"['2fb59493-02c3-4696-a2ec-50353ae36f25', '3809efb8-5704-4b2c-88b2-d3a3ac7e6577', '9b9db535-975e-4280-b7ac-1467f1351b92', '202f5a30-bc3d-4e59-9c49-d6510a12d1cd', '190bba7d-c99f-4797-b234-c4458aa77244']","['circuit-fibsqrt__bw6p7Sq', 'circuit-fibsqrt__XKjxduM', 'circuit-fibsqrt__7NwkP2p', 'circuit-fibsqrt__SLoeTqB', 'circuit-fibsqrt__FKoZd9n']",0,"[3622.24772, 2121.039872, 1024.611893, 1826.480872, 2142.042451]","[71.962103, 18.893107, 77.695536, 134.426677, 12.155171]",0.0,False,[] 
+deepseek-ai/DeepSeek-V3.1,cobol-modernization,5,"['f42c6a34-07c6-44bb-991f-1d45c2020542', '5c5e338a-cd06-4c00-9a96-2996381e18bf', 'd3d2d894-f879-4c43-93bc-6304b67ee4c5', '3550fb97-b4ff-4154-b1d1-303a3983cf81', 'd0f3aada-4fde-403b-8b42-d3f7ffa51204']","['cobol-modernization__cdrdMbw', 'cobol-modernization__pfNHNSz', 'cobol-modernization__JN6aoN8', 'cobol-modernization__CXRbhM4', 'cobol-modernization__2dm4Pob']",3,"[512.576236, 779.133076, 915.780992, 915.748719, 774.324846]","[41.672847, 35.608232, 53.154114, 52.403003, 78.450857]",0.6,True,"['f42c6a34-07c6-44bb-991f-1d45c2020542', 'd3d2d894-f879-4c43-93bc-6304b67ee4c5', '3550fb97-b4ff-4154-b1d1-303a3983cf81']" +deepseek-ai/DeepSeek-V3.1,code-from-image,5,"['f715ce5e-fe2a-48e1-b230-ae62244908c2', 'c8c67d8c-d6a3-4f00-9d2f-447353538b74', 'd9238b7c-668e-4609-b5e5-0348a0f792f4', '852834ef-c68a-46c2-8b92-2bc2682619cd', '454bb4cd-caef-48d8-a10d-65d29963c25e']","['code-from-image__3ZhPyFL', 'code-from-image__47JEUk2', 'code-from-image__NgYpMVU', 'code-from-image__gHTToiF', 'code-from-image__Df6Sxgv']",3,"[104.090577, 1225.531146, 163.461342, 1137.019798, 779.911904]","[26.752097, 71.179963, 15.752991, 31.01923, 37.262629]",0.6,True,"['f715ce5e-fe2a-48e1-b230-ae62244908c2', '852834ef-c68a-46c2-8b92-2bc2682619cd', '454bb4cd-caef-48d8-a10d-65d29963c25e']" +deepseek-ai/DeepSeek-V3.1,configure-git-webserver,5,"['395884b6-086c-449b-b11a-154a70c69e32', '3460bc75-a208-4ce6-a53e-ced1a201f24c', 'fbd7997a-754f-4649-9ae4-6d6e516dd222', 'e32b93fd-1ba5-4760-b14b-b6ab067ae1fc', '989b4cfe-2edf-4000-bfde-902f45637d88']","['configure-git-webserver__vS768Mm', 'configure-git-webserver__yQw9JB6', 'configure-git-webserver__PLYVREt', 'configure-git-webserver__9jioQoR', 'configure-git-webserver__nBKY6F6']",5,"[335.815698, 237.602154, 684.642626, 383.410069, 326.769556]","[17.705084, 28.14268, 148.734487, 59.081631, 39.70912]",1.0,True,"['395884b6-086c-449b-b11a-154a70c69e32', '3460bc75-a208-4ce6-a53e-ced1a201f24c', 
'fbd7997a-754f-4649-9ae4-6d6e516dd222', 'e32b93fd-1ba5-4760-b14b-b6ab067ae1fc', '989b4cfe-2edf-4000-bfde-902f45637d88']" +deepseek-ai/DeepSeek-V3.1,constraints-scheduling,5,"['52dd0a42-0529-4ff2-b822-33120fb18a63', 'da8185e9-c7cd-4580-87cc-126d4d3ff0ba', '79960a0a-c5aa-4468-a339-d3845f498f43', 'f668dff4-7763-4ed2-82d4-6ba8e462bf1e', '93ab80c4-8742-4f21-8a56-77e20d3afef6']","['constraints-scheduling__CJvPCXq', 'constraints-scheduling__cUT72MN', 'constraints-scheduling__nvG4BYS', 'constraints-scheduling__pqdvYwM', 'constraints-scheduling__tLrtNuK']",4,"[462.471271, 357.755916, 350.990819, 253.174731, 212.512964]","[143.130978, 30.872932, 134.142797, 37.300909, 41.011833]",0.8,True,"['52dd0a42-0529-4ff2-b822-33120fb18a63', 'da8185e9-c7cd-4580-87cc-126d4d3ff0ba', '79960a0a-c5aa-4468-a339-d3845f498f43', '93ab80c4-8742-4f21-8a56-77e20d3afef6']" +deepseek-ai/DeepSeek-V3.1,count-dataset-tokens,5,"['108bcdc9-f2bb-4c9b-ad1a-3d92c097462d', 'e21d5e09-1e84-4f46-ba25-82c475a5254e', 'a9e1875e-b84d-47de-9f50-f60cbaff12ad', 'd4d717d4-2fae-4fab-80b8-112fe58968c1', 'f168d391-0770-427c-8bec-b272105f2439']","['count-dataset-tokens__jrsttCE', 'count-dataset-tokens__k9h8FwK', 'count-dataset-tokens__dSon9ie', 'count-dataset-tokens__Vhmc57c', 'count-dataset-tokens__RLeJkVa']",0,"[794.54257, 741.614968, 919.91295, 919.248923, 616.656743]","[23.647681, 99.6724, 133.755854, 28.638403, 14.885999]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,crack-7z-hash,5,"['849a7209-4d31-44c5-92e2-e580ba21d6c5', '639d9c82-f31c-480c-9096-f6e05b2e7cfa', '7e21ae14-e04c-4f63-a7cf-836fbacf25d6', 'e212ca2d-37e8-4daa-a982-a7d2bd470bad', '5a599397-d5d1-498b-9ba0-6062f8a33ce1']","['crack-7z-hash__RUzb7Sn', 'crack-7z-hash__PkGzHuB', 'crack-7z-hash__mSRRPpc', 'crack-7z-hash__9E7p96R', 'crack-7z-hash__xGo8agC']",4,"[683.427737, 337.754947, 435.919866, 730.519052, 608.895771]","[27.724485, 19.4881, 46.906917, 31.084438, 10.861223]",0.8,True,"['849a7209-4d31-44c5-92e2-e580ba21d6c5', '639d9c82-f31c-480c-9096-f6e05b2e7cfa', 
'e212ca2d-37e8-4daa-a982-a7d2bd470bad', '5a599397-d5d1-498b-9ba0-6062f8a33ce1']" +deepseek-ai/DeepSeek-V3.1,db-wal-recovery,5,"['c415280f-a7d7-42f9-b619-96e962697aef', '8af0a91e-0c19-4366-86bb-128e0b8970f5', 'a4f7e7ac-78e2-4161-ba82-d948d89f8808', '92c6c990-00ce-4d3c-a165-6902bffa6d9d', 'c6f2cc08-9c24-4363-81ee-5b4493812064']","['db-wal-recovery__i7ypHRU', 'db-wal-recovery__7NLwVvJ', 'db-wal-recovery__hg2GPWT', 'db-wal-recovery__qwqjnWm', 'db-wal-recovery__M6XXZfn']",0,"[904.307912, 917.66822, 924.011394, 903.474161, 244.736084]","[25.894753, 48.873989, 42.378645, 32.025021, 12.709558]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,distribution-search,5,"['e56b5895-7bc5-4aba-9b33-78c32c3514b6', '4a627791-94be-48e9-a2d7-3b34944e2fc6', 'c5b97de4-2ba6-4e4e-869e-706eca38cb75', '4e1fda26-3afc-4927-a098-c1b6734a5939', 'ce017748-368f-4b27-835a-f551abb9cc1d']","['distribution-search__yukxDMX', 'distribution-search__Pdnyfmy', 'distribution-search__7VQDscy', 'distribution-search__c4e3DvS', 'distribution-search__S7pksts']",0,"[1247.073547, 1203.850305, 701.194769, 2101.630507, 1200.075023]","[176.507417, 14.312489, 23.861367, 51.795613, 149.408664]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,dna-assembly,5,"['c0f0649a-6e76-490f-b918-14e908dac67f', '131e5124-bb20-4ad5-aa84-74e8a013b13f', '961df3ac-84a2-42a7-8a33-d7ae773af3a1', '768daabf-6d64-4c42-bbf4-3746519d38ee', '14cf5a59-e1c1-4fa4-9511-8811bb56b711']","['dna-assembly__ETiuvzV', 'dna-assembly__TvJXabr', 'dna-assembly__tw7N6dL', 'dna-assembly__DWcLP9w', 'dna-assembly__Ef4v4Di']",0,"[249.394607, 245.836465, 95.402357, 257.260316, 720.039977]","[20.886514, 81.948431, 42.438748, 39.834675, 125.358087]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,dna-insert,5,"['645746e6-645e-4c35-9afc-87f4d2a6422e', '4772b338-83aa-4288-8a8b-e8312fc64437', 'a30284fc-2f41-4915-a4f1-87cd77e32f83', '9dd17647-8349-464f-b183-4d543bfb4e7a', '69d0c7c5-795e-4b27-aeef-1d661fe4c8c6']","['dna-insert__5XN2LQK', 'dna-insert__87AG7zT', 'dna-insert__esfdLUM', 
'dna-insert__V9ZksDT', 'dna-insert__Zd75UJJ']",0,"[180.13392, 367.339669, 360.002678, 631.8803, 411.636049]","[44.01344, 14.238747, 304.078276, 315.459758, 21.519115]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,extract-elf,5,"['9c813aee-a81d-4e90-8df8-f61b2dd81087', 'b0173bb2-013c-4542-b3ee-9fc316f66109', 'ea269c16-b482-46ed-9c5d-a6b39001f60b', 'ace5adf7-b5aa-493d-80cd-60b0824e7b52', '87bae500-5a3b-49dc-9328-e36c86f7d831']","['extract-elf__3uaNshJ', 'extract-elf__cxckdG7', 'extract-elf__ykkz2yc', 'extract-elf__ozeE3a7', 'extract-elf__J5jdTU2']",3,"[245.552533, 319.546535, 298.164443, 147.410969, 319.228374]","[81.998392, 50.186173, 16.545043, 21.906612, 21.973392]",0.6,True,"['ea269c16-b482-46ed-9c5d-a6b39001f60b', 'ace5adf7-b5aa-493d-80cd-60b0824e7b52', '87bae500-5a3b-49dc-9328-e36c86f7d831']" +deepseek-ai/DeepSeek-V3.1,feal-differential-cryptanalysis,5,"['af16970b-760f-4caf-aa56-b55320bc0afd', 'cd9cffee-c3dc-43eb-9b49-90bf814d6d4b', '26ad594b-f57e-4149-8603-5f0f30164e7d', 'a6cb4836-4784-458c-97e4-cf7b1276c3e7', '2701c142-1dc6-4d92-ba86-a37a7a87941e']","['feal-differential-cryptanalysis__XDyNJ5B', 'feal-differential-cryptanalysis__jerj8rR', 'feal-differential-cryptanalysis__uGpLq3t', 'feal-differential-cryptanalysis__YjiAvdu', 'feal-differential-cryptanalysis__odoo3BL']",0,"[552.497041, 121.222539, 1332.276715, 313.832335, 1800.03677]","[225.409529, 140.194093, 47.788635, 29.331469, 21.132024]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,feal-linear-cryptanalysis,5,"['d4916c40-e25f-4b8a-bc1c-53ee5faa10e4', '8f93f8dd-bda1-43da-90bb-3e34a4ced6a1', '9a79396a-1977-420d-83f7-de94cbe1967f', 'b3fe8586-e0be-4bbd-8c17-ebb4a4e957fb', 'ac37274f-8aa4-4e32-b192-db89f2d4fced']","['feal-linear-cryptanalysis__xkKcQsv', 'feal-linear-cryptanalysis__cz9hC9s', 'feal-linear-cryptanalysis__Qb8Tebv', 'feal-linear-cryptanalysis__aNE4VVo', 'feal-linear-cryptanalysis__LRat4fj']",0,"[1814.528365, 1810.565133, 1808.716178, 1808.088625, 1820.259437]","[42.834793, 18.892887, 40.811034, 89.752552, 
359.702298]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,filter-js-from-html,5,"['fd093889-93f5-47c5-95d3-d0847d43aad2', '534d4f44-c66f-4e1b-9c66-4d0fe1c6921c', '0d643e75-f492-44a8-92b3-10cd14ea0adb', '2a304c8f-ce37-449c-a47d-11d081360303', '0e56eaff-4316-4999-b939-3bcb50d11950']","['filter-js-from-html__ABdbVj5', 'filter-js-from-html__m6eAQbw', 'filter-js-from-html__A9MS62M', 'filter-js-from-html__5pzjWw4', 'filter-js-from-html__7pSRdKV']",0,"[465.015467, 40.795824, 789.684955, 155.615752, 277.571057]","[19.805745, 40.05017, 48.627263, 25.868788, 29.5216]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,financial-document-processor,5,"['b47d132b-0864-458b-941a-c35c3025ecc0', 'd469004d-7c96-4869-bdb3-32a99db4bad8', 'c6bf4b33-112b-48a8-b43d-2d148873923b', 'a01bedaf-0430-4429-b7c5-12f4a8a8206d', 'e5c32866-2596-4e0a-8412-b2baf48c4f6e']","['financial-document-processor__An7eAV5', 'financial-document-processor__jrjEfB7', 'financial-document-processor__QBPqziP', 'financial-document-processor__XAK4xDi', 'financial-document-processor__PWkVPxT']",0,"[354.047559, 448.614275, 1236.746396, 424.338483, 307.804841]","[49.340994, 21.349346, 45.264818, 126.935961, 128.461982]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,fix-code-vulnerability,5,"['65b0dcb8-abb9-4d90-8d84-9cee6791cfe5', 'bf977a62-01be-461b-8f59-a89b02628300', '52738a4c-dc37-41c8-85c8-19b5dcbe35c0', 'ae7b7011-1497-4ef7-9be6-533162879319', '2d57e2ad-f4f8-4f8c-b800-86d71a2c57a3']","['fix-code-vulnerability__5FwPjiG', 'fix-code-vulnerability__MH3def9', 'fix-code-vulnerability__fz2Q74c', 'fix-code-vulnerability__BFDueSk', 'fix-code-vulnerability__2G8Kouy']",1,"[541.276845, 572.617767, 1009.212331, 905.706249, 905.596019]","[29.890409, 76.299225, 6.139469, 14.718565, 11.786505]",0.2,False,['65b0dcb8-abb9-4d90-8d84-9cee6791cfe5'] +deepseek-ai/DeepSeek-V3.1,fix-git,5,"['c82a7958-26c2-41fe-9307-8fb583d2ade4', '84cac82c-cf22-42ea-a3e6-aff009f532ce', '84aa667d-cc24-4886-9042-33872de44c29', 'a0b5aa9d-3733-451d-ab04-0faae65c02b4', 
'ea45e8cf-2f4c-472b-b6dc-c792a28ece5f']","['fix-git__DSZLmhU', 'fix-git__bFBNec7', 'fix-git__EDy85et', 'fix-git__USNogzd', 'fix-git__6P8L6JD']",4,"[916.094816, 198.331857, 688.741257, 1711.423649, 85.629739]","[44.130259, 16.95277, 44.255298, 102.632489, 30.582927]",0.8,True,"['c82a7958-26c2-41fe-9307-8fb583d2ade4', '84cac82c-cf22-42ea-a3e6-aff009f532ce', '84aa667d-cc24-4886-9042-33872de44c29', 'ea45e8cf-2f4c-472b-b6dc-c792a28ece5f']" +deepseek-ai/DeepSeek-V3.1,fix-ocaml-gc,5,"['9d500747-e08e-404b-98eb-9307a901745d', '3c6580cc-8ecb-40ed-b72d-5baca655ad05', 'f96e7606-ded0-4ecb-801a-b7d70ff5bd4a', '03667af4-0c30-4352-ab3b-9ce5de3059d1', '5403e91f-05ca-4b8e-a964-3c117c60bc5f']","['fix-ocaml-gc__Wu8CcJr', 'fix-ocaml-gc__pq9HwCF', 'fix-ocaml-gc__d3vBnYQ', 'fix-ocaml-gc__ric9DMz', 'fix-ocaml-gc__s5LYrGJ']",0,"[2767.206252, 3612.920111, 1970.995101, 3284.454139, 3705.862011]","[44.258249, 121.691373, 119.813493, 19.735997, 164.084239]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,form-filling,5,"['37570c15-1821-4744-9b4b-e6025a08e3b5', 'f8d8f335-00ed-461d-bac5-fdad6d3d6857', '1d2e5304-d74f-4073-aa5f-9c3a9743d2d6', 'd9be2078-30c2-4de2-a095-53d2c0ed7253', '5751c21c-5cf6-40d9-897f-7082225a2b12']","['form-filling__F2BmsHZ', 'form-filling__hgmwsJu', 'form-filling__3bUZUiE', 'form-filling__PESgTUK', 'form-filling__23iK2mT']",4,"[263.519789, 207.304221, 433.218726, 2067.753321, 478.384476]","[3.754464, 3.602149, 64.783669, 16.731642, 48.544069]",0.8,True,"['37570c15-1821-4744-9b4b-e6025a08e3b5', 'f8d8f335-00ed-461d-bac5-fdad6d3d6857', '1d2e5304-d74f-4073-aa5f-9c3a9743d2d6', '5751c21c-5cf6-40d9-897f-7082225a2b12']" +deepseek-ai/DeepSeek-V3.1,git-leak-recovery,5,"['8312196b-b53b-48e3-a104-63dc0ce91ed3', '455b84ed-16fe-4d1b-8c20-5eded2d7c0f7', '3e9a6a89-ba8b-475d-af05-9fb438faa9d7', '030f820b-00df-4821-9836-bda4f095663d', '0335bd61-ed5b-43a8-a41c-782f7dd20693']","['git-leak-recovery__3QPg6UK', 'git-leak-recovery__RJEwBCy', 'git-leak-recovery__7eS9dS4', 'git-leak-recovery__vDWbLVp', 
'git-leak-recovery__bLWGqyB']",3,"[365.090115, 86.361018, 234.1554, 143.5472, 177.017306]","[35.069824, 31.718289, 70.036249, 20.652028, 27.383082]",0.6,True,"['8312196b-b53b-48e3-a104-63dc0ce91ed3', '455b84ed-16fe-4d1b-8c20-5eded2d7c0f7', '030f820b-00df-4821-9836-bda4f095663d']" +deepseek-ai/DeepSeek-V3.1,gpt2-codegolf,5,"['7d3aaf4d-cfd0-4ddd-96a1-3051d7006ac7', '1dbac28f-2e0c-4516-9e2f-460a389c2edf', '54c0dcde-65f0-4890-a479-ae42f67f6764', '6615f05e-c2ed-49b6-bf01-96a712db82df', 'ff5cd529-5759-4b07-a7b4-eb1e3cbb354a']","['gpt2-codegolf__DQiU6pU', 'gpt2-codegolf__NLWzt28', 'gpt2-codegolf__fnokoRz', 'gpt2-codegolf__QRYPbUF', 'gpt2-codegolf__nNps7YR']",0,"[906.423934, 334.100522, 901.040115, 903.040607, 696.311305]","[46.455233, 86.262946, 232.242911, 35.302506, 123.887849]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,hf-model-inference,5,"['74b9173e-a84f-4d54-a457-3f778769eb98', 'd90bf36b-518c-42b3-9255-110f25defc72', 'fd6ffe19-2b47-4463-aa15-f2fc1806f720', '1e865dba-6639-4ba7-96ef-63d134946042', '7487f5bc-9577-45cb-bf52-de7abb21f26b']","['hf-model-inference__qRpKViy', 'hf-model-inference__HeRWEvW', 'hf-model-inference__cgjejNz', 'hf-model-inference__HxR6WQS', 'hf-model-inference__RfNnMG3']",4,"[152.424247, 912.199275, 437.601852, 274.85526, 594.03429]","[37.60493, 305.015179, 61.42838, 36.482142, 56.455115]",0.8,True,"['74b9173e-a84f-4d54-a457-3f778769eb98', 'd90bf36b-518c-42b3-9255-110f25defc72', 'fd6ffe19-2b47-4463-aa15-f2fc1806f720', '7487f5bc-9577-45cb-bf52-de7abb21f26b']" +deepseek-ai/DeepSeek-V3.1,install-klee-minimal,5,"['58a73405-8b97-4458-89da-287c9dc561e1', 'c1972cc1-8185-4a4f-bd8b-0bb2dca36c8a', '00ba2e3f-ac3c-4c49-bcdd-9956db30b810', '24bdd134-0be1-428e-87e9-39b14059ccf1', '940dac43-4203-46fe-88cc-9cab0486c7f3']","['install-klee-minimal__yjPegsm', 'install-klee-minimal__Z4J5cDj', 'install-klee-minimal__HtmFhdU', 'install-klee-minimal__87cfuvd', 'install-klee-minimal__nyrpNjT']",0,"[948.324873, 900.050293, 900.52118, 904.257814, 1730.107276]","[9.39458, 
74.192458, 253.845365, 119.615534, 48.208827]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,install-windows-3.11,5,"['9b9f8148-5bb0-4f82-be14-16099f5bf93e', '91597cc2-906a-49f3-870e-f77ca9a3822c', '66c33fcb-659e-4812-8644-634fd8bc99fb', 'fcd53fec-4fb7-486a-827b-719e3f5ce8cc', '7e889790-c074-471d-b3cf-a1c28e3e95bf']","['install-windows-3.11__tjViFu5', 'install-windows-3.11__3m8LAKA', 'install-windows-3.11__fuyuhBE', 'install-windows-3.11__WDKS9ru', 'install-windows-3.11__Eq8Gd4Y']",0,"[183.731293, 1306.532762, 335.310874, 960.011897, 629.727973]","[43.427765, 39.688357, 29.732468, 16.40558, 33.139542]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,large-scale-text-editing,5,"['6039b297-c1ce-460a-b6c6-492f6a154c92', '6265fc34-cc3b-44a7-a5e2-97e10bb3282c', '80e5171d-2f59-4b46-911f-51567c16e20a', '8b92fefd-ddff-41ee-a57a-24fe7fdfcceb', 'c0f03aa3-64b2-4172-bd3c-9018bd73faf9']","['large-scale-text-editing__BfHikxn', 'large-scale-text-editing__8FdjjxH', 'large-scale-text-editing__cEJsxid', 'large-scale-text-editing__iGsNN4T', 'large-scale-text-editing__o93LKa6']",0,"[906.150451, 337.414913, 646.635553, 827.301076, 1204.830639]","[19.789111, 9.861267, 24.503608, 266.138266, 79.161949]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,largest-eigenval,5,"['7bb024c7-011a-4b66-8e79-188a2df3f5cf', '467c27cc-4a7c-42e4-b52e-40b29d1744ff', 'a1cf1b4c-f1e7-406f-965e-cafebd80f2da', 'a1956742-d1f4-4666-a5a0-000704d5d205', '60d33963-3c6e-46ee-8374-b89961aa210a']","['largest-eigenval__uhNEy5e', 'largest-eigenval__7NctuQC', 'largest-eigenval__w3uS6jY', 'largest-eigenval__ZdUo7nR', 'largest-eigenval__MQgRxEy']",1,"[909.685033, 739.444421, 837.504525, 815.661122, 317.239354]","[190.63793, 129.116569, 87.445816, 52.789683, 51.748982]",0.2,False,['a1956742-d1f4-4666-a5a0-000704d5d205'] +deepseek-ai/DeepSeek-V3.1,log-summary-date-ranges,5,"['6b942f33-a4d6-43c2-a4fd-4c43aa0a3f2f', 'ea6755e0-4673-40dd-a376-0b89aca8b8b6', 'dcb775a5-e9a4-4a7b-8e39-80d43e4438ed', '00a11fa8-017d-4c21-937d-fcab17c00c82', 
'fb5bc37e-1e80-42fb-8a1d-e97fb65dc585']","['log-summary-date-ranges__wQPce89', 'log-summary-date-ranges__3MXBTNt', 'log-summary-date-ranges__8soXaKX', 'log-summary-date-ranges__AkhrhzQ', 'log-summary-date-ranges__iWZpfHR']",2,"[296.870361, 120.690841, 288.142412, 144.934484, 107.215657]","[29.407658, 43.058517, 35.379474, 29.451679, 13.06501]",0.4,False,"['6b942f33-a4d6-43c2-a4fd-4c43aa0a3f2f', 'dcb775a5-e9a4-4a7b-8e39-80d43e4438ed']" +deepseek-ai/DeepSeek-V3.1,make-doom-for-mips,5,"['1a0eeb4e-7643-4cfe-8e00-546c0bede239', 'db558e6c-919d-433d-914b-b8d32d8196d6', '2442d7a0-f4d3-4d39-8e66-328c910d1a6e', '15600a7e-617c-497b-b760-32a2c35797f9', '1397f4e3-d908-4677-a0a3-afb6f942cb67']","['make-doom-for-mips__F7C7NY7', 'make-doom-for-mips__mKwJDUR', 'make-doom-for-mips__9u6cAUk', 'make-doom-for-mips__yv9QAHU', 'make-doom-for-mips__CkidpG3']",0,"[972.667, 900.002539, 806.154215, 904.182245, 644.990417]","[39.346422, 160.776129, 46.706863, 31.064751, 75.327566]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,make-mips-interpreter,5,"['8751a7d3-425e-44f5-8eb5-19bc6a9ad8b5', 'f7854252-a966-49af-bc48-fbaf7ca73a72', '7254b1bb-c27f-413b-b258-903a6674bc41', 'd8d31239-200b-465a-ab52-bb71630fd201', 'ac16808b-7371-4eb5-ab24-3359199c89ee']","['make-mips-interpreter__SeMyQxJ', 'make-mips-interpreter__F4Hbjbu', 'make-mips-interpreter__3nkbfkC', 'make-mips-interpreter__tAJiSSV', 'make-mips-interpreter__35pmsGy']",0,"[1831.131574, 1800.93035, 1478.041645, 1801.022778, 1174.320946]","[11.165103, 87.124576, 251.214128, 30.595042, 29.957896]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,merge-diff-arc-agi-task,5,"['67f5577d-b536-4e8c-be75-7247fe54d22f', '7a1a3b6f-8ba9-48ce-8d62-b3efa7fdd92b', '6752cd91-6165-402d-9106-ed358112f4ab', '97fcdb6c-20d8-433f-abd1-c71b85cd7324', 'a55e2ca9-c471-412f-8960-74314bec3eb8']","['merge-diff-arc-agi-task__BUTSUeS', 'merge-diff-arc-agi-task__EbLF3xv', 'merge-diff-arc-agi-task__YskscFi', 'merge-diff-arc-agi-task__AjXcZRC', 
'merge-diff-arc-agi-task__ibGMyBa']",1,"[915.268858, 235.582091, 900.059339, 387.762671, 936.71914]","[99.485874, 13.861496, 70.94192, 20.063012, 70.946448]",0.2,False,['7a1a3b6f-8ba9-48ce-8d62-b3efa7fdd92b'] +deepseek-ai/DeepSeek-V3.1,model-extraction-relu-logits,5,"['bdd04e74-d3e7-461d-87bf-1eb0b099edaf', 'd134c23e-d8aa-40ce-a71e-13709434bdb9', '5a788267-8374-4452-a3a3-795d9b0061e7', '0380d20f-a843-427a-a5a1-7f3ff93cd53d', 'a5e241b7-ccf6-42cb-ad6f-e14b9467d228']","['model-extraction-relu-logits__pzNW4Qi', 'model-extraction-relu-logits__j3TXr2R', 'model-extraction-relu-logits__bv5Y5cx', 'model-extraction-relu-logits__LMTbffa', 'model-extraction-relu-logits__XtV7rYD']",1,"[197.996922, 1025.870373, 798.141034, 463.33761, 321.638095]","[35.154049, 58.342987, 9.714415, 333.905323, 127.994143]",0.2,False,['bdd04e74-d3e7-461d-87bf-1eb0b099edaf'] +deepseek-ai/DeepSeek-V3.1,mteb-leaderboard,5,"['a642e599-09ef-478e-8be8-31183a6cd191', '91a43c48-4e40-43b4-b817-1117a64ddd41', '0f6a60dd-f49e-42e8-9efc-001126ec6763', '7c3c447d-b445-4dc5-8b66-411e925dd48f', '6a0230e5-b755-439c-845e-c652bf805aeb']","['mteb-leaderboard__U8K6SEY', 'mteb-leaderboard__coepp29', 'mteb-leaderboard__jM66HLq', 'mteb-leaderboard__SdZ72b2', 'mteb-leaderboard__SmYyMYt']",0,"[190.981321, 850.794505, 150.642923, 177.014717, 100.276781]","[3.988825, 45.756038, 63.501823, 4.228861, 20.629201]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,mteb-retrieve,5,"['4d8626aa-b16a-4b73-9396-2a78c86263c7', '9c253fb8-8230-4a81-9939-e549a065a59d', 'a799dc74-2b21-4dc4-9676-f2ec02d46b72', 'b15f9917-b080-4007-85c0-461f6a5172c8', '1ecbe457-d3d2-45cd-91e3-7b2a8b3b576d']","['mteb-retrieve__qBtUjDK', 'mteb-retrieve__igez96A', 'mteb-retrieve__wkkWAUL', 'mteb-retrieve__puQ2Kgr', 'mteb-retrieve__pQkb4x5']",0,"[85.97783, 247.913123, 195.511405, 125.278376, 185.611729]","[40.487382, 87.556231, 13.889505, 9.968564, 151.556578]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,nginx-request-logging,5,"['d55dee49-5c23-4134-9081-633c2b231440', 
'43f117d1-4663-4dd6-b0c4-79bd41ec21d1', 'b6387e81-c754-4704-a30c-e7013a23b8f3', '3a7177c5-e63f-4db2-a6d0-192a4d9eef02', '2bdb9791-14df-4b86-8d4b-31cc305586b4']","['nginx-request-logging__zYaRKy6', 'nginx-request-logging__5TFxVDx', 'nginx-request-logging__Auj2Egk', 'nginx-request-logging__qdn7b6Y', 'nginx-request-logging__zEDa78A']",2,"[510.60575, 411.122519, 420.484928, 147.721254, 516.587813]","[61.6697, 37.097807, 32.744698, 12.724627, 66.539996]",0.4,False,"['3a7177c5-e63f-4db2-a6d0-192a4d9eef02', '2bdb9791-14df-4b86-8d4b-31cc305586b4']" +deepseek-ai/DeepSeek-V3.1,openssl-selfsigned-cert,5,"['7ebb4290-803f-486c-b928-6409d9dc417d', '2622034c-f0f0-43a7-b181-c0029ace9380', '3d0a4824-e96e-4fa6-a694-344abeb3c8ad', '4b3e9157-d36a-4fc0-841b-ca70a5656b4b', '298ce628-6e43-4625-9581-800bdf02f2be']","['openssl-selfsigned-cert__sPdtLb5', 'openssl-selfsigned-cert__dsRSnSx', 'openssl-selfsigned-cert__8MCSyjJ', 'openssl-selfsigned-cert__TD4k2cX', 'openssl-selfsigned-cert__XvLiD5R']",5,"[298.786631, 552.602063, 219.22409, 208.543046, 125.310997]","[64.636382, 52.666487, 27.002923, 23.029872, 14.286894]",1.0,True,"['7ebb4290-803f-486c-b928-6409d9dc417d', '2622034c-f0f0-43a7-b181-c0029ace9380', '3d0a4824-e96e-4fa6-a694-344abeb3c8ad', '4b3e9157-d36a-4fc0-841b-ca70a5656b4b', '298ce628-6e43-4625-9581-800bdf02f2be']" +deepseek-ai/DeepSeek-V3.1,password-recovery,5,"['3e9afe9b-db9a-43e8-a4b8-b907adcfab7e', '061275aa-d075-4b06-a631-2beb561da44b', '42d94c9b-ee4d-4fb8-8dee-d5adfbddc7f7', '606da5f6-091d-4f1e-9220-d1cacd740efc', '81245d0c-d98b-4f80-b719-f9c193bd5711']","['password-recovery__DHFHUXx', 'password-recovery__x5hp7AT', 'password-recovery__8oHpHSL', 'password-recovery__AbPtSAX', 'password-recovery__fhEQaM5']",0,"[902.604878, 915.1463, 1324.567928, 906.732553, 767.896977]","[83.324817, 47.998666, 227.003482, 82.867484, 34.458011]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,path-tracing,5,"['9f47b0e3-05bb-4703-a172-76b774201914', '3df36c48-c757-47f8-a4fa-ec2c58162411', 
'04f840a0-3164-4f41-95e2-356df2c198bd', 'b0944d34-ea3f-4453-8fec-003053e20b08', '4028c47b-3410-4e57-83d1-4af1ff19dccc']","['path-tracing__X9VLfT5', 'path-tracing__K3zfGMm', 'path-tracing__cjYaHKd', 'path-tracing__un86Rva', 'path-tracing__pJ3Xdjc']",0,"[622.446642, 573.872056, 1803.631786, 1129.965242, 1031.468274]","[31.567199, 21.927178, 17.419002, 70.009453, 111.640624]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,path-tracing-reverse,5,"['b06b8e32-eec1-4113-961f-72a24749878b', '1c7e74ed-9c6a-48f6-b3f6-6ee6c40af43f', '3573a9b3-362a-4a88-83bf-babc2e692a3c', 'ebdf4de3-4492-47ad-9d54-6035269558e4', '7b78c7f2-6063-4274-8d97-2c2d986f1ce2']","['path-tracing-reverse__mVANxYH', 'path-tracing-reverse__D5pbrPn', 'path-tracing-reverse__yztqF4A', 'path-tracing-reverse__ifNgM8u', 'path-tracing-reverse__tzFdnyV']",1,"[1808.218798, 926.290808, 1403.807946, 1435.217047, 872.788249]","[96.238719, 34.675158, 37.550997, 43.845971, 32.390755]",0.2,False,['ebdf4de3-4492-47ad-9d54-6035269558e4'] +deepseek-ai/DeepSeek-V3.1,polyglot-c-py,5,"['67494241-47ce-4f91-b593-52dcc57f4f62', 'a16185be-39fb-4cd9-8ec8-a7c0a2697e3a', '97275d32-d710-410c-8ca8-0a84a9b187f7', '87f22486-c143-4c00-b7a1-1ef07f5d4862', '8db0f589-2478-4fc8-8ef9-019ec342543d']","['polyglot-c-py__JqBHBBb', 'polyglot-c-py__hMCJqAE', 'polyglot-c-py__wGRTriS', 'polyglot-c-py__576wVWY', 'polyglot-c-py__yQnqyAg']",0,"[912.715277, 919.667277, 900.001377, 989.25217, 901.604527]","[15.886815, 22.910812, 50.475051, 50.187859, 36.312288]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,polyglot-rust-c,5,"['82f712df-a525-482b-9571-4d0058cadbb4', 'aba0717e-fae8-4fda-a51c-ad26020e0f94', '361a1a5e-a9ed-4634-945c-c0cc72170616', '30ea6998-7bf6-4c27-a0f3-820a80c5acf7', 'dd85c226-f2b7-46f2-9d89-3de1e09421f7']","['polyglot-rust-c__hJLaw3d', 'polyglot-rust-c__ie75R9W', 'polyglot-rust-c__yzv7h8Y', 'polyglot-rust-c__YmAb24Q', 'polyglot-rust-c__4qLeTnC']",0,"[900.001404, 389.171353, 923.808872, 883.643068, 907.601446]","[47.55927, 28.279743, 28.287978, 
282.796892, 99.890967]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,port-compressor,5,"['62edb066-bb81-4e37-8f28-c90baefc7b23', '80a8b87c-8828-45a0-b7a4-84c875a8d38c', '4d7eb9bf-cb85-4a1d-902d-409a93a062f5', '86622a61-f9e8-4d0b-92e1-a181fca4b05f', 'b63d7f95-2fbe-40e0-945c-a2ff495c6f8f']","['port-compressor__T5sbMx4', 'port-compressor__8i3bNzz', 'port-compressor__h5tXMdZ', 'port-compressor__9AB44rf', 'port-compressor__zRdCV9e']",0,"[3605.12597, 3606.337451, 3640.213913, 758.673041, 3604.34111]","[41.910806, 44.167858, 38.761534, 11.812336, 123.136006]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,prove-plus-comm,5,"['9110aac7-51a0-4e89-9762-bab6828604c4', '867a3f48-f7ac-46ce-90ee-e8b99b9108a3', 'd4aae31c-9030-4983-b6f1-163c3ce875e9', 'd068d0c2-582f-48b7-9a82-b38acbbb4330', '30afb470-d200-4ae2-a6a0-85ae6904c15c']","['prove-plus-comm__2BvZx9n', 'prove-plus-comm__8xJceP8', 'prove-plus-comm__3w7cM9v', 'prove-plus-comm__3BM5NrT', 'prove-plus-comm__eGeTtpE']",5,"[490.490105, 158.454283, 106.915639, 351.333096, 260.602416]","[157.892259, 60.005401, 26.026621, 90.631934, 58.7375]",1.0,True,"['9110aac7-51a0-4e89-9762-bab6828604c4', '867a3f48-f7ac-46ce-90ee-e8b99b9108a3', 'd4aae31c-9030-4983-b6f1-163c3ce875e9', 'd068d0c2-582f-48b7-9a82-b38acbbb4330', '30afb470-d200-4ae2-a6a0-85ae6904c15c']" +deepseek-ai/DeepSeek-V3.1,pypi-server,5,"['9237f9fe-3088-417c-869c-844ba45a9a96', '6376dd52-f3f3-4d29-92eb-999aa68b0584', '626b6e8a-404a-4037-8682-ac85fa08d911', 'dd29edfb-f115-42ca-b42d-655ebf73d59d', 'd15453ca-0a5b-4980-92b8-d4ab222553fc']","['pypi-server__S8t2i9P', 'pypi-server__U6tsdSm', 'pypi-server__BZZxMiJ', 'pypi-server__9qjY5rX', 'pypi-server__sgnzbYw']",2,"[902.408906, 144.712043, 923.342997, 438.034544, 863.334157]","[11.663242, 49.755196, 46.661007, 21.228238, 21.959606]",0.4,False,"['9237f9fe-3088-417c-869c-844ba45a9a96', '6376dd52-f3f3-4d29-92eb-999aa68b0584']" +deepseek-ai/DeepSeek-V3.1,pytorch-model-cli,5,"['c1f8bae4-037c-4021-86b7-e7be4ef15c1c', 
'35a419d4-b010-4931-b994-586c5b879f71', 'fd546a0d-23fb-4821-b9cb-505c0ca04752', 'b8424f88-4c20-4594-ab70-baa6344ae901', '1a7e41ab-4ed6-4c9f-b48c-cc31233ad18e']","['pytorch-model-cli__w9y9eDw', 'pytorch-model-cli__u32zygW', 'pytorch-model-cli__ZescuH5', 'pytorch-model-cli__6XLjW8y', 'pytorch-model-cli__y8fQSxN']",0,"[755.537638, 782.216051, 205.551128, 655.597516, 1198.713508]","[15.29616, 30.904091, 34.24271, 72.2889, 152.009718]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,pytorch-model-recovery,5,"['419dd4c2-415e-45ee-a15e-dc05469f9c72', '55386ba2-3251-4485-8ccf-3be1c12d3f94', 'bb20ae24-0979-4e17-94fc-16bff66a856e', '92836f0d-83b3-4aa7-ade3-4b3a007e7174', '1c2a7380-3c92-49e6-aed3-366ab1a18c98']","['pytorch-model-recovery__oZeVMAC', 'pytorch-model-recovery__KNTAW5r', 'pytorch-model-recovery__Ds6Jc6S', 'pytorch-model-recovery__BMpDpak', 'pytorch-model-recovery__P2MeLj2']",3,"[914.39971, 285.598543, 908.910899, 176.558374, 706.758314]","[11.72202, 48.90571, 28.169239, 17.212449, 73.096784]",0.6,True,"['55386ba2-3251-4485-8ccf-3be1c12d3f94', '92836f0d-83b3-4aa7-ade3-4b3a007e7174', '1c2a7380-3c92-49e6-aed3-366ab1a18c98']" +deepseek-ai/DeepSeek-V3.1,qemu-alpine-ssh,5,"['695f2f2e-32dc-4362-aaa2-474e703e8615', 'dcaa9baa-73d6-40fe-b124-3382093504da', 'b9cdca01-ed4d-4c34-91bb-2f20c1f67517', '6333fe25-886b-45ac-983f-189d825d7f89', 'eadaa92e-92a2-4996-a15c-73d13b62624a']","['qemu-alpine-ssh__twQZXri', 'qemu-alpine-ssh__Lwn9A8G', 'qemu-alpine-ssh__raivxXQ', 'qemu-alpine-ssh__VqeyRDV', 'qemu-alpine-ssh__sX9mTJo']",1,"[903.293499, 1045.194376, 902.799817, 907.926095, 323.904361]","[5.251097, 4.478689, 4.106984, 10.895346, 17.105157]",0.2,False,['6333fe25-886b-45ac-983f-189d825d7f89'] +deepseek-ai/DeepSeek-V3.1,qemu-startup,5,"['45113b8f-5122-4a49-819d-f18ec0fd864c', '29f7ddba-4e76-4cac-9614-5e79e5eba6dc', 'f181d90a-b9cd-41b1-b880-709b215f5c14', 'fd26450e-0802-4612-86ef-179e5b4a258f', 'f28694ea-e1ec-45dc-9a07-4863f3418846']","['qemu-startup__zhBPmqr', 'qemu-startup__5TKrrHk', 
'qemu-startup__gG9vbdu', 'qemu-startup__pYCi4oN', 'qemu-startup__Vp5dqNM']",1,"[149.373774, 81.613233, 316.110884, 1009.572981, 169.785717]","[4.113803, 7.654813, 29.717376, 6.684607, 3.168345]",0.2,False,['f181d90a-b9cd-41b1-b880-709b215f5c14'] +deepseek-ai/DeepSeek-V3.1,regex-log,5,"['dde7b849-23fd-4465-910e-b76d98eb7d13', '4d33822f-dd89-4688-b02b-ad502a70b8f4', '6c2e55cf-3b8b-436a-bd66-ecb3ae6e3b74', 'fa39bd03-bb5d-445a-aa3d-1313fd1e4ab4', '718c8f43-e58f-40f1-b70b-c3e87a262142']","['regex-log__Z3od9oa', 'regex-log__YLXQadb', 'regex-log__Zfyj8Ho', 'regex-log__szRwDKq', 'regex-log__o6bDsGk']",1,"[144.65089, 170.801851, 159.102717, 136.612886, 123.500391]","[154.361379, 82.783999, 98.117635, 79.236494, 31.723438]",0.2,False,['718c8f43-e58f-40f1-b70b-c3e87a262142'] +deepseek-ai/DeepSeek-V3.1,reshard-c4-data,4,"['4e745656-8035-44fe-b628-eca6c18b7247', '3e75a1dc-6a8e-4009-a673-542bcf460d83', 'f6ef142c-cddf-414e-9068-6f1cac4f6630', 'd295bca6-dd0e-4cf3-893f-a7d8db6ef416']","['reshard-c4-data__gKeWym6', 'reshard-c4-data__VTB7LXw', 'reshard-c4-data__oZw386V', 'reshard-c4-data__3iZDHxR']",0,"[311.898176, 253.422488, 231.644752, 800.145566]","[114.171125, 227.098741, 12.443187, 127.858797]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,reverse-engineering,5,"['8b18dedb-1aec-4eb7-88ad-b1eb1c9cc167', 'c7d2275b-eda7-4853-884c-24d599ad6089', '10c49c67-5897-4bfd-9d09-b0b5afdfd329', '26984e19-0f0e-40c4-876e-0edaef947c3a', '2c5458da-d174-40c0-87c2-1653a701e994']","['reverse-engineering__MDS8GyR', 'reverse-engineering__rir4qsu', 'reverse-engineering__3GkY9GC', 'reverse-engineering__pNjAjPJ', 'reverse-engineering__MKYivMW']",1,"[1805.682187, 513.760676, 496.798506, 1826.775972, 1808.092655]","[72.866182, 21.570233, 29.151617, 198.339851, 59.05894]",0.2,False,['10c49c67-5897-4bfd-9d09-b0b5afdfd329'] +deepseek-ai/DeepSeek-V3.1,run-pdp11-code,5,"['7df3ba0c-109b-4dab-8d0b-ea0bb74ee875', 'f2faf36e-b0f2-43cd-a284-924ff7d50adb', 'a2d20d7e-15bc-4b35-9758-e997bd79f615', 
'9c0c3e00-8bfc-4b18-9d4d-7e7ff6ab1ee1', 'f28927a8-6e4c-45c7-918b-24048dcc416a']","['run-pdp11-code__VPMEiXM', 'run-pdp11-code__sN26KxA', 'run-pdp11-code__k7evEjz', 'run-pdp11-code__i6AVNR8', 'run-pdp11-code__TG2ESGF']",0,"[1002.31305, 1012.509882, 1002.745341, 1000.335696, 613.385989]","[161.261918, 46.966191, 135.799819, 47.993524, 44.23911]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,sanitize-git-repo,5,"['a1bd368b-70f4-437b-8205-5f04f11eefa4', 'f8432166-343e-4898-b4f1-ba88e47b7de4', '97e28987-629e-4208-8547-62524dd7084d', 'a9c1c270-64db-46e1-86be-a3eebea2218e', '572b1ccd-ce4a-435d-ba9b-c7debe4d9e60']","['sanitize-git-repo__CM8cXob', 'sanitize-git-repo__yyMQTXU', 'sanitize-git-repo__nTXrLgZ', 'sanitize-git-repo__pqF2ci5', 'sanitize-git-repo__UqWRA2u']",0,"[259.682539, 1139.911479, 509.294057, 802.64853, 269.101973]","[214.882639, 39.938417, 33.360377, 19.837654, 13.90798]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,schemelike-metacircular-eval,5,"['3fb77c08-0ac4-45f4-9067-0f4e658855f3', 'cbf27075-def5-4941-83f2-c5d72d4a3357', '1a46f3f1-b9fb-4ebc-b237-591ea5e2c1aa', '5c608902-1e53-4c3f-a80a-748d8db22af9', 'fd4a0bc6-f80c-4d9e-8eaf-9d8a22f3c02d']","['schemelike-metacircular-eval__9MykoAk', 'schemelike-metacircular-eval__2uMhxBi', 'schemelike-metacircular-eval__4EAAKZp', 'schemelike-metacircular-eval__VWGQkeW', 'schemelike-metacircular-eval__2tBRFbQ']",0,"[2407.670819, 2452.70064, 2176.908106, 2320.406535, 1499.610287]","[31.46568, 40.689165, 22.272607, 41.736198, 29.299384]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,sparql-university,5,"['1ddb6f62-5437-4951-96ae-6d69b770cf5d', '7b75891e-17bb-4be9-aaad-b7e6cf32fddb', '5e548c0f-6dae-4f6c-98e0-e4d9ffb1ef17', 'f99b4129-b499-4886-9549-d2951d24dc7b', 'e202023c-29a7-4e16-b0c4-1e18ec6cbd91']","['sparql-university__GkUEsZM', 'sparql-university__yvRotMB', 'sparql-university__RkQJyy5', 'sparql-university__pGX6o52', 'sparql-university__6RyWfeY']",0,"[393.138564, 770.924272, 244.162693, 721.252193, 188.5622]","[73.428268, 65.744344, 
49.132983, 104.738935, 107.520021]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,sqlite-db-truncate,5,"['1cd09a7e-a926-42d3-872b-7ee45441cd78', 'fe83ebc1-3ff7-4def-82dd-e60808bb20a7', 'a71ed3c3-4eb6-46c1-9fd6-859ac6b67f17', 'a89e3665-6b62-4a97-a605-9c0f676554a1', '6d7c73bd-3eaf-4645-9d2d-e1a55411354e']","['sqlite-db-truncate__bnjS9Eo', 'sqlite-db-truncate__3VTWptF', 'sqlite-db-truncate__WcdMVE8', 'sqlite-db-truncate__DGFQrC2', 'sqlite-db-truncate__ES66GMF']",0,"[290.578305, 900.063573, 152.114013, 248.433824, 745.641291]","[22.665588, 175.118054, 75.298474, 40.724225, 18.131866]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,sqlite-with-gcov,5,"['5cedf39e-3a28-4040-bdaf-909a91d9efd3', '6338fa2a-0fd2-4c02-935e-2f89055bf215', '97274735-5ad9-422f-bd69-18a5f51b5ce8', '0e55ca86-932f-43b9-ad0b-00f1030783d1', '651239f2-6eae-42f9-9d5a-6c3a0e804e4b']","['sqlite-with-gcov__mv2SSKh', 'sqlite-with-gcov__Ld8LkrK', 'sqlite-with-gcov__Rjkrkau', 'sqlite-with-gcov__9qKraed', 'sqlite-with-gcov__joqdTCR']",4,"[415.302093, 392.713251, 233.986976, 170.473386, 410.989663]","[55.879012, 34.422939, 53.053417, 19.490715, 26.459548]",0.8,True,"['5cedf39e-3a28-4040-bdaf-909a91d9efd3', '6338fa2a-0fd2-4c02-935e-2f89055bf215', '0e55ca86-932f-43b9-ad0b-00f1030783d1', '651239f2-6eae-42f9-9d5a-6c3a0e804e4b']" +deepseek-ai/DeepSeek-V3.1,torch-tensor-parallelism,5,"['8c63a47d-8b03-41a2-99cb-620cd38bbffb', '35e5a5fa-d458-46bc-931d-c5497b6f9c22', 'b015ac8a-4da2-4b05-b6c5-fe3edbcd01d4', '07cf8898-1be8-405e-a40a-2297b5ac347c', 'a0e604e0-a9f2-4f91-b814-79a5ef02240a']","['torch-tensor-parallelism__aAYMPBk', 'torch-tensor-parallelism__EauUivv', 'torch-tensor-parallelism__xHkFDJa', 'torch-tensor-parallelism__PFGFRX9', 'torch-tensor-parallelism__EHfYCYs']",0,"[179.24029, 269.647752, 11.058099, 97.884612, 698.459332]","[86.045811, 69.014829, 14.939612, 212.788196, 65.581158]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,train-fasttext,5,"['06f0e241-6d28-48e4-bd5f-f9b89cacceaf', '4ccaa0b7-63a0-4c03-84c2-ab8046d5f886', 
'f5f6e727-433e-47ca-9ae0-e83a5dc75a34', 'e437a042-2d76-45b7-aa18-78aa7c1a09cc', '895598b7-5163-4e78-b72e-9114e94faeac']","['train-fasttext__yKturZx', 'train-fasttext__RuNZbPM', 'train-fasttext__TcSr2QY', 'train-fasttext__KigQ5zk', 'train-fasttext__H8xbzPz']",0,"[3246.338034, 1980.26789, 1893.742171, 3600.03086, 2501.538762]","[14.936811, 39.05491, 32.666492, 287.371418, 72.146807]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,tune-mjcf,5,"['1bf00f9f-1834-47f5-9cd5-43823df894f9', '60a0eaef-b10b-4181-a28c-2234d2979154', '44a6d18f-41ae-448b-ac70-aa2b98482df2', '6ca3e89f-d062-447f-8984-9d8546740405', '21a45437-c1e3-4b72-b6ba-c4cd2f458c19']","['tune-mjcf__jwewi9i', 'tune-mjcf__ebrDjAU', 'tune-mjcf__TmVj6sJ', 'tune-mjcf__qTgEusH', 'tune-mjcf__QN9xcLd']",0,"[939.710948, 900.099051, 1005.474516, 902.471228, 1046.321196]","[58.886638, 9.695875, 31.717411, 15.076949, 59.536622]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,video-processing,5,"['2735f797-6ff8-4133-b974-3c9b64806e5a', 'da22d103-c125-4b0a-a191-774618359ebc', '973963fd-f94f-415a-b01e-003830f865e5', '57d50c78-45bc-4194-b71c-0c0c639f8783', '031e87ef-51ef-49e5-8992-45ecda232b84']","['video-processing__4FDwQYb', 'video-processing__sHsWzyS', 'video-processing__7a8ZQXr', 'video-processing__u2Mh8zk', 'video-processing__fKJVXMV']",0,"[321.598354, 429.39043, 108.320554, 339.742443, 377.818725]","[84.581475, 79.475146, 13.849977, 78.092277, 58.96035]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,vulnerable-secret,5,"['feb1d26d-3c7c-4a92-b120-5c24f019d2b4', '2b027ad8-265c-4035-ac8e-7715cd96bceb', '9b0e0c0c-2413-4c1c-b0a1-f627d2e7290e', 'a5086497-24b6-4f1f-89f3-f685ebfdb916', '1d75e94e-40ad-4571-8ae4-d65e60c2a718']","['vulnerable-secret__Rm9PWvJ', 'vulnerable-secret__kv5vhmV', 'vulnerable-secret__A4H7c5o', 'vulnerable-secret__QepPkD5', 'vulnerable-secret__b9Ym3gE']",2,"[752.382045, 535.583917, 340.363162, 900.017554, 911.703471]","[48.74125, 10.442896, 13.163447, 145.134735, 22.284451]",0.4,False,"['feb1d26d-3c7c-4a92-b120-5c24f019d2b4', 
'9b0e0c0c-2413-4c1c-b0a1-f627d2e7290e']" +deepseek-ai/DeepSeek-V3.1,wasm-pipeline,5,"['291a8432-894a-4774-9239-1add40c4f689', 'fc18deba-5397-401a-92cc-72ff6614f77c', 'a8c7dbe8-7902-4f99-a666-1e13c78fde02', 'b7bfafc2-a9ba-4789-bc08-8fca0843559d', '01ba47ef-b52c-4da6-82b9-4793b4f62243']","['wasm-pipeline__FChUEmB', 'wasm-pipeline__UwE55NS', 'wasm-pipeline__LLCpFvU', 'wasm-pipeline__UCRzLdm', 'wasm-pipeline__mCrGLiG']",2,"[1025.70974, 919.386683, 323.960896, 661.050241, 829.860657]","[36.213408, 22.176919, 8.292168, 3.705048, 14.032356]",0.4,False,"['b7bfafc2-a9ba-4789-bc08-8fca0843559d', '01ba47ef-b52c-4da6-82b9-4793b4f62243']" +deepseek-ai/DeepSeek-V3.1,winning-avg-corewars,5,"['ef316108-fd79-4334-97c5-64cd1a5a4141', '3458662c-4385-409d-9a49-9954dba94727', 'e8bd4d79-ab27-433a-9e3b-ec2eee0b6c43', 'a4975c59-a39c-42b0-a418-6de0ad4647ab', '63a03bce-761e-4b8f-86a8-587a34f7098d']","['winning-avg-corewars__AmhjSYv', 'winning-avg-corewars__dRxVWr8', 'winning-avg-corewars__iGmLBhu', 'winning-avg-corewars__QrNKE9T', 'winning-avg-corewars__rMhSTJY']",0,"[851.993879, 1545.868203, 580.508966, 1357.0253, 650.885878]","[4.646628, 54.904056, 4.584661, 20.4221, 52.632463]",0.0,False,[] +deepseek-ai/DeepSeek-V3.1,write-compressor,5,"['02985f59-ddc1-48cd-8403-66aff8fc2126', '3b29e901-6502-4d4c-b0f1-4233f59c9cba', '4bfa8dfe-29ef-405a-802f-2c7b7e7f178a', 'bb1f978f-7401-4b2d-8877-f5734cf24a72', '6e2c0a75-16bd-4296-bc9c-5610f0581d7f']","['write-compressor__feeBwjh', 'write-compressor__iRqUxM3', 'write-compressor__dY9RHhS', 'write-compressor__Dv8b3wu', 'write-compressor__eTc2n2E']",0,"[939.336987, 598.722451, 915.705531, 311.253096, 917.610836]","[285.003803, 111.690104, 54.769621, 22.781663, 103.039203]",0.0,False,[] +gemini-2.5-flash,adaptive-rejection-sampler,5,"['c5319641-bdc5-4564-9cdf-45f510944655', '7efcbc2e-b819-4733-8889-559bd94012cb', 'b0e2f43f-19d6-4412-8a61-da781c456e4d', 'cebc15ff-5382-4b44-a166-ca69347a3ba4', 
'9eae2eeb-837c-4e28-a30f-7b8e03c71fc3']","['adaptive-rejection-sampler__YBM4MxY', 'adaptive-rejection-sampler__XrDJRqc', 'adaptive-rejection-sampler__37gM5HW', 'adaptive-rejection-sampler__eEgpxe7', 'adaptive-rejection-sampler__ftbxZGU']",0,"[900.559728, 907.473425, 906.827773, 917.145767, 905.959331]","[60.782417, 23.845595, 313.626928, 38.215872, 122.359999]",0.0,False,[] +gemini-2.5-flash,bn-fit-modify,5,"['8a07ec33-5adb-425e-a29b-0341d2090844', 'b19c5622-fbda-49e0-850b-83df83360911', 'c86f2110-37fd-43a2-9bc4-d0259420da96', 'ff50a638-2941-4063-a70e-5fc0e5508c2b', '223908dc-2738-4e5c-a9f0-f38df2118d0e']","['bn-fit-modify__AYJqTqE', 'bn-fit-modify__jhDTWNB', 'bn-fit-modify__ocJpEw6', 'bn-fit-modify__FcHrbnw', 'bn-fit-modify__dEzXjBa']",0,"[3639.357988, 3608.480334, 3600.030334, 3600.651741, 3620.176057]","[63.325802, 186.267151, 96.40357, 43.954421, 245.52279]",0.0,False,[] +gemini-2.5-flash,break-filter-js-from-html,5,"['2e924e64-1325-40a9-9c8d-903d02435aa3', '9842df1a-15f2-4b48-adde-c1283523f546', 'b34aed8e-0c82-4b4e-a774-efb8bf69a22e', '2bdb51b4-7f78-4e61-8138-6f4fc392d3ca', '3acfc990-885b-473e-a139-e3d42adb6c5a']","['break-filter-js-from-html__5LJAaZi', 'break-filter-js-from-html__sRksQeq', 'break-filter-js-from-html__rFtSEkV', 'break-filter-js-from-html__ULRjsLh', 'break-filter-js-from-html__AqcpU3v']",0,"[132.207215, 1203.721666, 127.737458, 119.978262, 135.464199]","[120.747147, 57.715856, 52.210566, 55.488751, 16.232456]",0.0,False,[] +gemini-2.5-flash,build-cython-ext,5,"['d1709980-2236-4d4b-9453-b01217df5aed', '477a1f21-5ce6-4952-b061-3257213448c0', 'ed5dd1f2-c3cd-4031-9f8d-461afecd1352', '965e09ab-6dbb-473b-8e80-1c6a9d50d954', 'aa98cd68-5141-49fe-a4de-cdb3cc8946f3']","['build-cython-ext__GcCdhSp', 'build-cython-ext__Vw72MMy', 'build-cython-ext__wECwchc', 'build-cython-ext__Sq4KPkr', 'build-cython-ext__HMu2hNW']",0,"[633.901747, 928.748796, 900.239173, 906.126771, 1017.33654]","[98.339004, 44.498991, 8.318928, 243.770037, 117.317887]",0.0,False,[] 
+gemini-2.5-flash,build-initramfs-qemu,5,"['22df531f-bf24-4f6d-bc7b-b010873ab465', 'be3618de-a0c0-4a68-b4e9-0a4309c9e10b', 'd1563f30-58e4-472c-8888-d9dde2c6ecb3', '03c00b2b-cd16-4db1-b0f7-ff5c0b64853b', '311e767d-a2f7-408a-95e2-21b355cbc10a']","['build-initramfs-qemu__Tm2urqE', 'build-initramfs-qemu__nLsK24v', 'build-initramfs-qemu__gf8x6Y9', 'build-initramfs-qemu__dufKLLm', 'build-initramfs-qemu__xU58aWQ']",0,"[902.21007, 136.46695, 315.570178, 382.629468, 276.387594]","[13.934329, 68.520359, 46.6688, 80.675271, 103.414873]",0.0,False,[] +gemini-2.5-flash,build-pmars,5,"['fb88a68e-8936-4759-8ad6-58b5cd07cd59', '06150deb-40ab-4945-a75a-8868751e998b', '85c0ff26-265a-4210-b780-bb3db15ff8ea', '3c3d3ffa-5e36-48c5-bfaf-7f9e311e7db0', '5de0f073-202b-4bb1-81a2-d2922e1f60ab']","['build-pmars__rrU6Xoy', 'build-pmars__zsLF2qn', 'build-pmars__TKhm3ev', 'build-pmars__cn8hUGi', 'build-pmars__YwZ3Pzr']",4,"[526.52064, 297.764865, 271.468212, 533.871312, 907.796197]","[11.908383, 4.73089, 4.746846, 35.823524, 8.1741]",0.8,True,"['fb88a68e-8936-4759-8ad6-58b5cd07cd59', '06150deb-40ab-4945-a75a-8868751e998b', '85c0ff26-265a-4210-b780-bb3db15ff8ea', '3c3d3ffa-5e36-48c5-bfaf-7f9e311e7db0']" +gemini-2.5-flash,build-pov-ray,5,"['e2647158-ab74-4739-9e45-7eac69decfdc', 'a15d21ff-d07f-45c6-a446-c82bb92fb37b', '02a750d9-a393-4f5d-a578-29d0f56611df', '3d9e25c2-33b9-459f-a20c-ed3e951a6e5e', '7734c321-1804-4408-b076-2e15f9504101']","['build-pov-ray__HF7yKcN', 'build-pov-ray__wGnE5xA', 'build-pov-ray__WP2eMDC', 'build-pov-ray__KUfuej7', 'build-pov-ray__evywaXp']",0,"[1089.011571, 1283.197018, 5622.761483, 786.053583, 6000.193284]","[42.235129, 75.690217, 33.078001, 42.329369, 54.967231]",0.0,False,[] +gemini-2.5-flash,cancel-async-tasks,5,"['2e2bbce6-92ad-40fc-afd3-6c8d99e937bd', '2a545337-3758-4fba-9002-a02d342df170', '24daaac1-2943-4906-b792-3e7994ffc378', '455235f9-312f-467c-9838-c24a11a152eb', '4737bd65-f497-4f4f-9586-e30c92d25d55']","['cancel-async-tasks__ktPsmaN', 
'cancel-async-tasks__FsPo9Rj', 'cancel-async-tasks__VTTAd9Q', 'cancel-async-tasks__ficDoYe', 'cancel-async-tasks__n57NS7o']",1,"[684.612171, 86.1771, 300.163772, 160.217778, 111.386539]","[37.560738, 14.018986, 203.801996, 43.864042, 103.429916]",0.2,False,['4737bd65-f497-4f4f-9586-e30c92d25d55'] +gemini-2.5-flash,chess-best-move,5,"['c4d6605e-a3ad-4d4e-b910-87b7e4a27052', '1f55ccc5-6b4a-405b-88eb-cd12d07484a6', '7bdef584-b684-48a4-929e-e59bd6e7b804', 'e8566611-72b9-42d3-abc8-c97a9e87451a', 'f83fb955-0a19-441c-8343-d723811ecf42']","['chess-best-move__gfStHcj', 'chess-best-move__NXBRuDi', 'chess-best-move__6NvKzEn', 'chess-best-move__WH4Yn58', 'chess-best-move__sk3mZXz']",0,"[627.610071, 653.378282, 694.564034, 900.511685, 907.158475]","[211.135535, 69.41541, 23.038904, 7.714497, 24.338223]",0.0,False,[] +gemini-2.5-flash,circuit-fibsqrt,5,"['5db2f59e-165f-4634-82d7-fec45a0a9bcf', 'a0982491-253e-488f-9e63-cd1163e81581', '81e97aca-9980-4470-ad77-a7032a80b237', 'cfed86a5-f3cd-43a6-9098-4cb5001731bd', '3fb70c5d-603d-4a56-9544-1fa6e86acb49']","['circuit-fibsqrt__n9jcbEc', 'circuit-fibsqrt__VTBw5GN', 'circuit-fibsqrt__iycZSi9', 'circuit-fibsqrt__TEViipW', 'circuit-fibsqrt__TWgJE7F']",0,"[3600.288436, 3605.968766, 3287.977055, 3600.086186, 3605.343807]","[66.340644, 28.223493, 28.881926, 17.068837, 14.203205]",0.0,False,[] +gemini-2.5-flash,cobol-modernization,5,"['49eea92a-499a-403b-a601-f3925dd97902', 'ba97c69f-8d65-406c-af0c-3628817ed782', 'af9d300f-272e-4492-b156-80bf6a2f5210', '44084ffe-ea1e-43a8-a734-6dc402078c66', 'd774b13d-faa4-4d06-80c3-755b99d54104']","['cobol-modernization__aVrGS9m', 'cobol-modernization__35SDnKJ', 'cobol-modernization__7xWMZMF', 'cobol-modernization__U93J6o6', 'cobol-modernization__id3bLZM']",1,"[914.479715, 933.830954, 174.45787, 553.277356, 900.71718]","[54.660502, 81.033376, 43.739164, 59.996166, 64.177152]",0.2,False,['44084ffe-ea1e-43a8-a734-6dc402078c66'] +gemini-2.5-flash,code-from-image,5,"['de054569-f5c4-4dca-b603-d3982af0c590', 
'bbcf0ba5-3373-4084-9473-1af7971155d4', '986fdea7-2ccf-45aa-845e-47b004b01fbe', '07713ad8-d4e0-4a7d-bfa9-ecc24dc5c356', '4203ab45-55b1-4d42-a5c8-a1cae86b628f']","['code-from-image__VEYdSxW', 'code-from-image__NTua9CM', 'code-from-image__NJLchW6', 'code-from-image__tYWHqnD', 'code-from-image__uNLZXBw']",2,"[157.591857, 175.876213, 279.361533, 1200.001559, 355.965274]","[25.54709, 20.651542, 13.972023, 74.234841, 80.605723]",0.4,False,"['bbcf0ba5-3373-4084-9473-1af7971155d4', '4203ab45-55b1-4d42-a5c8-a1cae86b628f']" +gemini-2.5-flash,configure-git-webserver,5,"['fa24fa9b-a773-4b3b-8488-c22d34301de8', '3433962e-d8b6-47c9-b107-27c9d4903e31', 'b7d75e8f-c633-4f53-98d9-e27efa6b0f9e', '55989932-54ad-4b20-bc1a-cb12e52bbac5', '3184d1fb-d2ea-420d-bf73-c4756dc26155']","['configure-git-webserver__BpFvC6B', 'configure-git-webserver__JFTQAZb', 'configure-git-webserver__WhVpZCo', 'configure-git-webserver__w38apyy', 'configure-git-webserver__HZ3ycro']",0,"[144.130926, 493.917429, 437.069834, 215.560349, 405.264032]","[27.996955, 29.067198, 65.016011, 59.096914, 77.595234]",0.0,False,[] +gemini-2.5-flash,constraints-scheduling,5,"['3b0cee7f-69dd-461c-8b31-5703dda6931c', 'd2e9a14d-4ba2-46a7-bff2-cc494246c169', '1e021ab3-4b9f-4499-bba0-935090590c39', '5ecf2fc0-3c49-44b6-9e73-dbaed520130d', 'f49d58a7-dcd5-4f7c-b363-57e7c4bf5ee3']","['constraints-scheduling__Hce9LhJ', 'constraints-scheduling__qZEBCxH', 'constraints-scheduling__XyjRjy9', 'constraints-scheduling__25w9N3n', 'constraints-scheduling__6y5hHoX']",2,"[386.337337, 1211.78287, 446.132755, 492.901699, 130.979526]","[144.97702, 72.691176, 45.254949, 12.131559, 13.828476]",0.4,False,"['d2e9a14d-4ba2-46a7-bff2-cc494246c169', 'f49d58a7-dcd5-4f7c-b363-57e7c4bf5ee3']" +gemini-2.5-flash,count-dataset-tokens,5,"['79545fd6-fa00-4dbb-9309-639a5af908da', 'c132e1d5-f324-44eb-b955-54d601713052', '422efa4f-9373-49fd-8fc3-304fc208bda5', 'f51a4346-8c17-499d-8c43-51d22aac2fd5', 
'4eb1ef79-211b-4759-bada-10520d7582f4']","['count-dataset-tokens__BMEa94R', 'count-dataset-tokens__iQTwjU3', 'count-dataset-tokens__M59qG2q', 'count-dataset-tokens__dusk5rT', 'count-dataset-tokens__ixpbyAW']",0,"[369.28612, 303.303175, 662.968065, 386.547217, 912.516773]","[26.446408, 40.827368, 16.246015, 32.49734, 15.387671]",0.0,False,[] +gemini-2.5-flash,crack-7z-hash,5,"['b12512ca-5ec4-4f1c-849a-16e15eee4ee2', '90195fc4-abd2-4ba3-8b83-4455e623e9d4', 'c0ea14c1-d2f2-4cb3-bf51-1ee91c6dd330', 'f23c0e44-c9ff-4ec5-81b7-cb98e4f67cba', '7242fe82-1dcb-4237-885d-e03b24c74654']","['crack-7z-hash__3t9CD6Y', 'crack-7z-hash__VW4Bd6S', 'crack-7z-hash__AqU6YsJ', 'crack-7z-hash__XrPju6z', 'crack-7z-hash__NPhdasu']",4,"[605.059823, 556.26839, 327.482622, 792.182081, 238.596896]","[26.411972, 18.326137, 30.584362, 43.375939, 11.673864]",0.8,True,"['90195fc4-abd2-4ba3-8b83-4455e623e9d4', 'c0ea14c1-d2f2-4cb3-bf51-1ee91c6dd330', 'f23c0e44-c9ff-4ec5-81b7-cb98e4f67cba', '7242fe82-1dcb-4237-885d-e03b24c74654']" +gemini-2.5-flash,db-wal-recovery,5,"['86c503f7-e52c-4968-9a1e-522a65e56d3a', 'a30ddbad-c58c-4740-9f6d-1bd05f10734f', '458baed0-2b9d-4a50-97cf-f5c4261ce38e', 'b48883c5-a60a-4eb0-83e5-2010edbeb4c6', '2f3f2560-34ef-4277-97af-b49f16738bd8']","['db-wal-recovery__ibwiofR', 'db-wal-recovery__qhR8Z7w', 'db-wal-recovery__McyDecT', 'db-wal-recovery__WrWzLeB', 'db-wal-recovery__6Q3Rvu3']",0,"[904.015827, 900.048317, 332.896125, 965.916599, 907.301296]","[25.220048, 13.469561, 29.739336, 78.804879, 12.808702]",0.0,False,[] +gemini-2.5-flash,distribution-search,5,"['fd2c08e5-c249-4ed7-ae2f-47315c6831c3', '1f8d1ebd-1a70-4a76-ab8a-53c91ac2ad7f', '0edb7b99-353c-46c4-a818-5eff90d1df83', 'ab4aeaa7-e721-4f7b-bbc2-23f1c82a79de', '4b17eecb-0f5f-405a-87a8-d3d9f5d254ed']","['distribution-search__v3fbfXi', 'distribution-search__XaxUDQR', 'distribution-search__qyM4X6A', 'distribution-search__8bTwPH6', 'distribution-search__5wHrCZR']",0,"[1122.881936, 3600.560965, 3600.053689, 2288.844989, 
3603.911274]","[24.426557, 37.566602, 28.574105, 48.373878, 155.016906]",0.0,False,[] +gemini-2.5-flash,dna-assembly,5,"['a7f11ae4-baec-4d2d-a80d-0d88afbac197', '8ef8fa0d-989d-45b0-a3f5-4b1a1a3eabcf', 'e84f9480-c3bf-44bc-abc6-fcd83b7d9366', '09096bf7-c0db-47c7-ac0c-956e1ed86948', '4d1fc036-a982-4957-a335-fa14a1b685ec']","['dna-assembly__JHwpaRV', 'dna-assembly__ZWSrkwP', 'dna-assembly__WzfpBYN', 'dna-assembly__iDxMVyh', 'dna-assembly__pgM5HCC']",0,"[738.785815, 337.615446, 730.423479, 759.453596, 746.757306]","[38.987549, 19.636748, 55.747543, 176.772716, 23.194353]",0.0,False,[] +gemini-2.5-flash,dna-insert,5,"['e44cf683-bc75-4d8b-8af8-878d6cdf9e1a', 'e5fa7fe4-5449-41be-b98f-4cd16b03b822', 'efef8e61-e0b6-47d5-9fd6-e906cf9f8d5e', '53e4ab75-260d-4300-afc6-93a74d677755', '3a94e965-6fa6-4572-970c-102b67228bba']","['dna-insert__7PGLnCq', 'dna-insert__AP5ANc2', 'dna-insert__dBHyRxf', 'dna-insert__hM6qwTa', 'dna-insert__3jquKrg']",0,"[384.723377, 360.961252, 366.968483, 396.535286, 628.360897]","[38.392063, 25.640102, 30.770844, 29.468698, 305.812811]",0.0,False,[] +gemini-2.5-flash,extract-elf,5,"['06915318-5cc7-450a-a044-5bb02368200d', 'be77ee40-b5f7-417c-92dc-e32ca9ca0154', 'bcddc2e8-f2d5-4d57-a543-d4c133c811e5', '51398805-a475-431c-b400-1826c0acf5f1', '4c43f87a-b358-47e7-8530-b94836e99819']","['extract-elf__joBU25p', 'extract-elf__XmxKmsi', 'extract-elf__G9dPFqH', 'extract-elf__YrTkkn5', 'extract-elf__6tcQgvs']",2,"[164.870108, 541.481969, 636.028645, 203.397886, 117.742669]","[21.213209, 159.903966, 82.132503, 22.589688, 76.620433]",0.4,False,"['06915318-5cc7-450a-a044-5bb02368200d', 'bcddc2e8-f2d5-4d57-a543-d4c133c811e5']" +gemini-2.5-flash,feal-differential-cryptanalysis,5,"['c9511fbf-837e-44cf-98ef-e01227d81b1f', 'ba2a9cc4-23bc-4476-886f-9e5fd5327577', 'e4cb414c-e754-4e3d-82cf-23616d20a6dc', '32752537-4bb3-485b-acd0-f7f04d7b476f', 'ba5ef0d0-e8f9-4a83-85ff-aade6ba0db51']","['feal-differential-cryptanalysis__CTEU9Fh', 'feal-differential-cryptanalysis__nGziPeT', 
'feal-differential-cryptanalysis__7ufwkpT', 'feal-differential-cryptanalysis__Wd8Qc6T', 'feal-differential-cryptanalysis__NCmYqiE']",1,"[335.795619, 431.355964, 273.586965, 1803.341612, 290.39154]","[211.922723, 80.28214, 28.667402, 80.352624, 246.025428]",0.2,False,['c9511fbf-837e-44cf-98ef-e01227d81b1f'] +gemini-2.5-flash,feal-linear-cryptanalysis,5,"['d82801ba-982d-453a-93f1-1638700e8aa1', 'e7a54e35-e1c6-4406-9a95-252b8c60f21b', '8d53738e-78fa-40a4-a012-104d00581289', '2df4eb12-2067-456e-a26f-da04b97a0445', '302db4c2-6813-490a-9546-a2cb644b3cc7']","['feal-linear-cryptanalysis__9Rxytd5', 'feal-linear-cryptanalysis__Fq3vRDh', 'feal-linear-cryptanalysis__mb2FUwN', 'feal-linear-cryptanalysis__zweZB8G', 'feal-linear-cryptanalysis__WdAUPju']",0,"[1811.558613, 408.574574, 1828.375895, 657.466154, 1800.879325]","[154.433019, 101.736628, 65.211543, 28.463714, 24.433688]",0.0,False,[] +gemini-2.5-flash,filter-js-from-html,5,"['a8c47109-9595-4109-a8b0-ba1fb8bd3f47', '86fde7dd-f8b4-4551-8c4a-ca07e17eead1', '9a169b9a-0014-4d0f-bf94-17e4a4da08cd', '0a7f9ad3-831b-4a14-8f78-33ea4e35e2b1', '7ba63556-9ba8-4932-95ac-296dce71b609']","['filter-js-from-html__EbT2wbD', 'filter-js-from-html__asaJEBt', 'filter-js-from-html__vCuDXVE', 'filter-js-from-html__g5p3G5R', 'filter-js-from-html__rvzsubg']",0,"[900.006478, 912.106816, 406.952729, 210.840016, 900.016529]","[77.961316, 77.912132, 55.453526, 51.260574, 44.359717]",0.0,False,[] +gemini-2.5-flash,financial-document-processor,5,"['800d390a-d43c-4908-8946-44bd5f7d9c7d', '1b0a2cc5-d2e5-46c6-bfa2-c4f63d43072d', 'c31cfdd1-602e-4a34-b8e8-822820d3e96e', 'c335124e-6426-47cb-9c63-39b9c66da73c', '23c9be1f-303c-4779-b2e0-2a989702f0fe']","['financial-document-processor__M53X3c6', 'financial-document-processor__3reZ9dQ', 'financial-document-processor__A5jhBbH', 'financial-document-processor__VzMx5F9', 'financial-document-processor__R9wx7E8']",0,"[1217.995469, 1203.330971, 129.254561, 1172.18605, 496.266184]","[65.74927, 133.466877, 21.263597, 
28.852528, 247.50332]",0.0,False,[] +gemini-2.5-flash,fix-code-vulnerability,5,"['ed2e77eb-5a57-4158-b278-dd2a70896713', '0e5549d3-3346-4946-9b1c-b82839b84a22', '036e9923-884f-4dab-82bb-b9d46375bee3', '31092841-cbf3-4b2a-9d67-b83c6529933b', '2f0b151f-66dc-4251-bb94-24a1f84fa4d1']","['fix-code-vulnerability__LgeT79x', 'fix-code-vulnerability__5wwSgqT', 'fix-code-vulnerability__KtMmizr', 'fix-code-vulnerability__JpCUtTD', 'fix-code-vulnerability__oXvhag2']",0,"[904.470365, 900.057884, 900.15045, 949.079368, 805.724129]","[49.082975, 42.646346, 3.448504, 4.716597, 8.622677]",0.0,False,[] +gemini-2.5-flash,fix-git,5,"['9468c801-e77b-476d-9e56-c7618c84dd59', 'a0e28d61-75b6-4342-9394-261bbdeafce2', '6214e46a-4b19-4ce0-8fe2-9c7fa20366ca', '5693b834-6e6f-4009-9265-694e90b6ae80', '1ca88d95-8d7a-42b6-b3fe-1c68146b3437']","['fix-git__Nhvcd4j', 'fix-git__thfbf2x', 'fix-git__vG74g4d', 'fix-git__eaxJFh9', 'fix-git__JyeqKmf']",4,"[80.054881, 190.960504, 120.301791, 137.661949, 202.258595]","[21.389023, 38.267719, 48.419115, 17.992957, 33.370241]",0.8,True,"['9468c801-e77b-476d-9e56-c7618c84dd59', 'a0e28d61-75b6-4342-9394-261bbdeafce2', '6214e46a-4b19-4ce0-8fe2-9c7fa20366ca', '1ca88d95-8d7a-42b6-b3fe-1c68146b3437']" +gemini-2.5-flash,fix-ocaml-gc,5,"['f7ce9acf-1cf6-4572-8703-d60472b19b0e', '803c1e68-4163-4e0b-97e2-5ef7f7023c76', 'a961976c-4b1d-47ce-94b6-60c5aa5f2359', '5e79216e-c42a-4949-9f33-65582bed2132', '3a6c3eb0-95dc-4360-8a2b-5c704d3f01d3']","['fix-ocaml-gc__X5nXeHm', 'fix-ocaml-gc__gh9Bv46', 'fix-ocaml-gc__5Nydp74', 'fix-ocaml-gc__noL4AXM', 'fix-ocaml-gc__ptcMDWc']",0,"[3600.024888, 3600.001254, 3600.488881, 3600.002398, 3612.833067]","[22.371869, 168.245253, 45.049371, 31.853779, 123.555185]",0.0,False,[] +gemini-2.5-flash,form-filling,5,"['998fe7e9-864b-4b9a-a5cc-fb570d96ea14', 'a72353b9-8e9e-4429-a162-4a881f617712', '614a8383-5b89-412d-8883-8f8ec2b340ed', '5e318720-a337-45a0-84ab-c68b187d81b7', 'd78c2f30-c4d2-4eac-bf8e-2ed0a1883628']","['form-filling__YDchwpD', 
'form-filling__eyTwoLe', 'form-filling__moyoTeJ', 'form-filling__JpS3NBn', 'form-filling__vqYS9pT']",0,"[912.370358, 901.56128, 903.93215, 417.453321, 909.09964]","[9.287846, 9.141205, 17.768144, 4.796334, 14.799765]",0.0,False,[] +gemini-2.5-flash,git-leak-recovery,5,"['696ebfe5-84c3-4be8-a817-a71ca527e29f', '136f4164-95d3-477b-9baf-e01a4459b77c', '874e3c23-a45e-4e2f-aff6-dc76926431ee', '48de3f9d-ad90-4ce2-9e83-49b9fa08e635', 'd29570e7-ac70-457a-b457-122d9963dad6']","['git-leak-recovery__H9xMWqk', 'git-leak-recovery__bzD42Sn', 'git-leak-recovery__sPxpELC', 'git-leak-recovery__nC2sx93', 'git-leak-recovery__fuoDnpr']",3,"[678.939516, 131.339016, 274.338204, 127.800433, 525.141885]","[50.403044, 26.400828, 29.999683, 180.891809, 107.936376]",0.6,True,"['696ebfe5-84c3-4be8-a817-a71ca527e29f', '874e3c23-a45e-4e2f-aff6-dc76926431ee', 'd29570e7-ac70-457a-b457-122d9963dad6']" +gemini-2.5-flash,gpt2-codegolf,5,"['0a48e58a-60e1-427d-8751-98eae75a539d', '5b83c9c7-c005-4a95-89be-846ae500efc3', '2442eec9-28bf-4b5f-9032-3db54b84e24b', '8be099ba-c0ed-49a9-ad52-e0985226337b', '56f114d0-aae4-45b0-87eb-73e6b3221e4e']","['gpt2-codegolf__2kQzrti', 'gpt2-codegolf__nH9ScTG', 'gpt2-codegolf__VD3xud9', 'gpt2-codegolf__ALZGFcp', 'gpt2-codegolf__kSpwKfm']",0,"[386.891306, 96.970774, 563.656472, 219.296895, 96.722721]","[186.957828, 340.706301, 23.998783, 140.82034, 51.916919]",0.0,False,[] +gemini-2.5-flash,hf-model-inference,5,"['cd492866-5608-40c9-86d0-0cb7fa6682df', '8729d83e-2e4c-47af-9e5e-6af1b56cdce6', '8e527883-3aea-4182-89af-29ef15c567a3', 'faa263f1-85a8-4abe-8d2f-e2f6068fbd3d', '34855aac-e62a-4db5-aec5-c1d9f4ae13d4']","['hf-model-inference__MLSfdtY', 'hf-model-inference__ejESFwr', 'hf-model-inference__BUWYP3r', 'hf-model-inference__Vw9nSXG', 'hf-model-inference__teGp9Ro']",3,"[80.987162, 200.120874, 254.420101, 153.094486, 342.702249]","[14.709214, 51.050459, 171.590415, 63.251393, 25.036004]",0.6,True,"['8e527883-3aea-4182-89af-29ef15c567a3', 
'faa263f1-85a8-4abe-8d2f-e2f6068fbd3d', '34855aac-e62a-4db5-aec5-c1d9f4ae13d4']" +gemini-2.5-flash,install-klee-minimal,5,"['d99c5e9b-5ae4-4eb9-a4ca-85bbb5a843ed', 'ad43c031-dbd6-4417-9e16-15c74eb7cd02', '1737acd6-bc8f-4704-ba36-ab214e8bc851', '531a69fd-6fd5-4be4-93f4-5b947121cf1e', '19382d53-a43c-45af-a7e2-20425ce1b2cd']","['install-klee-minimal__D4h8Ujq', 'install-klee-minimal__Av5p4Gq', 'install-klee-minimal__dwTUupG', 'install-klee-minimal__zZ5yPUG', 'install-klee-minimal__oAepeFH']",0,"[900.076384, 906.371958, 900.065827, 900.124814, 900.155278]","[89.480728, 69.064106, 64.527766, 94.750448, 111.417938]",0.0,False,[] +gemini-2.5-flash,install-windows-3.11,5,"['cf28343f-8e72-46de-a10c-71f2af7e5b44', '209a3ce1-a607-4779-8105-5a2a8f03f55d', '32cfe257-a021-422c-9268-133e1757e04c', '3f6bff5b-608c-4ef4-8f5b-701c1eacc719', 'e8552904-cc24-4377-9cf9-732b5db09d74']","['install-windows-3.11__qmU3u6D', 'install-windows-3.11__TRc68LW', 'install-windows-3.11__dMphRJV', 'install-windows-3.11__WpzCZgN', 'install-windows-3.11__iHKmxkZ']",0,"[127.662313, 113.706274, 328.857361, 254.501894, 1228.322464]","[18.701237, 26.238416, 35.797068, 20.208466, 39.659352]",0.0,False,[] +gemini-2.5-flash,large-scale-text-editing,5,"['3634b51d-f88c-4f37-b842-8249692cb8c7', 'b2788058-e06c-4526-b055-4998d1f9ae33', 'd5b34d69-68b6-4144-93c4-d20890f88e84', 'a2281df0-d2df-43cf-8537-04b70c6ed2d1', '3c45ac9c-e7a5-4b8e-98f9-8a5861ef26ec']","['large-scale-text-editing__ADKGAm9', 'large-scale-text-editing__8WBJV5g', 'large-scale-text-editing__RbMf6dz', 'large-scale-text-editing__JxwhptG', 'large-scale-text-editing__pLTGvRo']",0,"[243.565163, 352.885575, 203.000537, 109.534043, 241.052288]","[230.218167, 321.281667, 18.210826, 20.045703, 89.546011]",0.0,False,[] +gemini-2.5-flash,largest-eigenval,5,"['09eb55ed-67d8-4a4b-bc05-8d0ab7932fdd', '24250723-f08e-4070-9f23-c14d7665eb57', 'a2e17e65-5d9b-45cc-9cbc-e9f79b1de82f', '0bd8e410-1d71-4e28-a1d3-40ea9b9a3567', 
'c0c8c7e6-7da2-4b5c-9a88-e71423700e72']","['largest-eigenval__efbf8gs', 'largest-eigenval__gvafePp', 'largest-eigenval__ZB9DLLe', 'largest-eigenval__hUzfPAB', 'largest-eigenval__coRVz2t']",0,"[927.189793, 908.270288, 908.089323, 900.235319, 900.406137]","[305.435071, 42.799981, 56.172087, 37.105714, 43.1243]",0.0,False,[] +gemini-2.5-flash,log-summary-date-ranges,5,"['d175e902-714d-4be9-b80f-2a8bc23e3787', '7bceb0f5-9dbd-4804-a5b0-4887835d8af8', '5734640c-6cbb-457d-b62d-8c4798eb87be', 'e32e39ef-8b5f-44f0-a7c7-b3909cb7dde8', '774fb23d-079f-4374-a253-eed5275fe36b']","['log-summary-date-ranges__PswhCuL', 'log-summary-date-ranges__fpscuGs', 'log-summary-date-ranges__JuAu3oo', 'log-summary-date-ranges__ES9xfrM', 'log-summary-date-ranges__gQXrWEp']",0,"[214.425678, 251.721092, 171.118966, 210.464959, 70.699959]","[67.797593, 163.841929, 78.572897, 71.724326, 33.141748]",0.0,False,[] +gemini-2.5-flash,make-doom-for-mips,5,"['51779134-2afb-415c-aabb-bac628bd3e81', '1bde948b-4128-4100-9baf-08bdc84b8be2', 'a13e771c-3d30-41a6-b50e-ee754018657c', '86934fd0-337b-47b4-9004-ed4041dcb44a', '26971107-e1da-4865-b2cd-3f2a0d3adb91']","['make-doom-for-mips__eY5TVjP', 'make-doom-for-mips__pAJHZzr', 'make-doom-for-mips__LXNyVvq', 'make-doom-for-mips__B8qBoUg', 'make-doom-for-mips__iDXGURH']",0,"[728.76104, 910.993634, 236.206561, 900.553414, 915.855123]","[94.665662, 30.826496, 34.185028, 124.670827, 23.032034]",0.0,False,[] +gemini-2.5-flash,make-mips-interpreter,5,"['53fbbe87-b97e-4c9f-9593-ff96a1d4ad89', '85d65925-9c3c-405b-a8fc-8c40e6c2ab52', 'de14bcba-3abd-4a85-9015-5f558009014b', 'f050894e-2717-4831-9cd8-09d9d7fcf54b', '50549937-d8ca-423d-8be6-f4c5aef66fd9']","['make-mips-interpreter__da2h3CX', 'make-mips-interpreter__uvWV98r', 'make-mips-interpreter__NFKDNcu', 'make-mips-interpreter__xC4PKTF', 'make-mips-interpreter__XeYkeJ5']",0,"[1814.779469, 1800.722235, 1800.612837, 2074.266498, 1817.152785]","[203.713337, 89.524326, 98.20127, 11.038934, 241.459774]",0.0,False,[] 
+gemini-2.5-flash,merge-diff-arc-agi-task,5,"['dcbf2602-8b4b-4bda-a165-cdeaa56bf48f', '6cb366ea-282c-4b5b-a7e0-b0df094dab48', 'bb446a9f-a960-4737-b8d6-6728783efad9', '1edc117a-b336-485a-908c-23b45aa6802f', '0717b99f-9080-436a-b518-d32c2d0d77d0']","['merge-diff-arc-agi-task__eyp2qw4', 'merge-diff-arc-agi-task__b3yJKsr', 'merge-diff-arc-agi-task__XCEDt8r', 'merge-diff-arc-agi-task__WBezNpB', 'merge-diff-arc-agi-task__2ciHtAN']",0,"[593.534303, 908.598271, 912.572668, 900.054173, 905.608288]","[25.142485, 113.661502, 73.330724, 19.757302, 149.95717]",0.0,False,[] +gemini-2.5-flash,model-extraction-relu-logits,5,"['b95070cc-959e-4171-b2a5-328186e6d775', '17474b49-b197-4cd7-ad39-1cfb51b5b867', '98cfd85b-4705-4b86-b069-39da3b5dfaf3', 'a0584ffb-489b-4a7d-8173-fd06e52e58a3', '91d7ff78-9e8b-4bb6-be03-77ba1f88d54d']","['model-extraction-relu-logits__ihb5Kak', 'model-extraction-relu-logits__o4yaegV', 'model-extraction-relu-logits__J9gqytd', 'model-extraction-relu-logits__QEUTs72', 'model-extraction-relu-logits__S6Wuxp4']",1,"[202.07906, 900.415638, 904.734862, 233.88401, 579.314233]","[98.1677, 216.754179, 25.830032, 47.636816, 35.00838]",0.2,False,['98cfd85b-4705-4b86-b069-39da3b5dfaf3'] +gemini-2.5-flash,mteb-leaderboard,5,"['89a1c6ab-7123-4a5c-9532-a75973c98d28', 'cd91bf5f-b311-4160-a9ae-63982c217631', '8c3d5cd8-aac7-4e83-9b54-944eba57d818', 'e14de55c-b8f0-4fb5-8f14-f1587bbb00da', '380f007c-66c4-4d41-bc98-e4c30ead6385']","['mteb-leaderboard__LgDeieo', 'mteb-leaderboard__6rxErwU', 'mteb-leaderboard__4kHW7iB', 'mteb-leaderboard__s2vJpFH', 'mteb-leaderboard__5KJzUmx']",0,"[100.554383, 327.728106, 78.655178, 163.401351, 35.149628]","[82.483473, 8.929297, 26.921246, 32.356473, 2.103791]",0.0,False,[] +gemini-2.5-flash,mteb-retrieve,5,"['1b8d5412-2245-4426-8e18-b282f7f51905', 'a96d27af-d2b1-452c-9fcb-b0139e76c7ea', '038cc009-23e9-4b09-931b-ee8d35985188', 'c901c141-be15-477b-90d4-938d0b4e7323', 'db3d4068-02d0-4976-824b-0fc251c20940']","['mteb-retrieve__dHaGi47', 
'mteb-retrieve__LTXafLz', 'mteb-retrieve__KauNEJm', 'mteb-retrieve__zAsbN2G', 'mteb-retrieve__sXXXExM']",0,"[397.667136, 229.928467, 92.911694, 171.517033, 125.761679]","[21.569039, 36.72508, 11.993864, 23.242928, 72.503998]",0.0,False,[] +gemini-2.5-flash,nginx-request-logging,5,"['6d21b2e1-3b18-4728-a7df-9fc83f20760c', 'e7db87ce-d6f7-4932-9f01-6f1dc5210108', '91aebae0-0889-4e7c-b509-59d9dd0a837d', '06265101-16a5-4857-9202-ecf3934fec1e', 'e749f863-648d-454a-9b65-6e91bd21b961']","['nginx-request-logging__XFQRqBy', 'nginx-request-logging__HcUm9Hf', 'nginx-request-logging__VLn9a7D', 'nginx-request-logging__oFZGtEA', 'nginx-request-logging__DPwd4jE']",0,"[226.678299, 923.493182, 79.144991, 900.089541, 55.245023]","[33.983019, 87.52412, 32.120845, 172.446243, 18.988753]",0.0,False,[] +gemini-2.5-flash,openssl-selfsigned-cert,5,"['15a16daa-0e26-4476-a624-60b230504850', '76e1a9b1-2efb-4747-89e7-ff252702bcf9', 'dcfd5012-3732-4bad-ae3f-bb9b15aa4d0d', '84c9fd73-fc0e-4aad-ace9-3c4a7c491674', 'a5671ed3-abda-46b2-a381-b0c600ce9d2a']","['openssl-selfsigned-cert__LAQYaq9', 'openssl-selfsigned-cert__yWRCRYB', 'openssl-selfsigned-cert__847Peeu', 'openssl-selfsigned-cert__RyQ6Xnx', 'openssl-selfsigned-cert__C2WfNAw']",0,"[189.281763, 71.064142, 96.088008, 161.431979, 205.537988]","[47.67, 17.202963, 30.154963, 44.916098, 37.727915]",0.0,False,[] +gemini-2.5-flash,password-recovery,5,"['b7db7a19-6ff8-444b-adb0-43c7f555ac70', '230a3ee5-9a5d-4e90-aa54-3677f3dd4904', '37eb3b9c-c908-48ed-9ed6-295e94dc022c', 'b4d29457-fa80-4b77-80e9-3d24f20b1deb', '7720dd5c-786d-446a-a3e7-c68b68d46b98']","['password-recovery__jWJonYw', 'password-recovery__uaQU2pu', 'password-recovery__2fHN7k3', 'password-recovery__UTNoBcn', 'password-recovery__9QVwnNt']",0,"[1325.439506, 900.081882, 900.023634, 674.968792, 904.2988]","[339.738045, 37.113749, 61.727362, 21.601889, 38.723155]",0.0,False,[] +gemini-2.5-flash,path-tracing,5,"['9e91b193-0a4d-43b1-879c-101a4c003b74', 'bc631276-1e87-44dd-a178-5424cd80fac1', 
'400e8377-a400-41c1-b54c-bd2768af7556', 'e16faf66-75d5-4309-b8d8-3741e7002606', '366ae9a2-490f-4c39-a2a0-96addccc4369']","['path-tracing__FHQ9dd9', 'path-tracing__rAvxM7Q', 'path-tracing__eNCp2kN', 'path-tracing__tYivztC', 'path-tracing__NzzYCqX']",0,"[604.98068, 1544.269619, 346.891061, 273.498202, 193.685318]","[15.978642, 326.312808, 81.33427, 28.286075, 63.801193]",0.0,False,[] +gemini-2.5-flash,path-tracing-reverse,4,"['2b942958-a411-4a13-bdec-767ced7a9a7f', '62df704f-1020-404d-a9d6-e2f27ce0c402', 'e5412bfd-92a1-4748-a489-1e2f03a34940', 'b3e1734d-044b-432b-b8ef-8cfcb4f2b212']","['path-tracing-reverse__Msaw38M', 'path-tracing-reverse__g9AtxDL', 'path-tracing-reverse__Fum33r4', 'path-tracing-reverse__d3qCKD4']",0,"[1800.932954, 1816.031548, 1143.986856, 1239.350293]","[21.350405, 38.445047, 21.240347, 89.670827]",0.0,False,[] +gemini-2.5-flash,polyglot-c-py,5,"['1ae5f9d3-733a-4930-a440-b86338c76a50', 'ce5acadf-52ac-46f1-9156-4e97bab3f8d5', '6a76852c-afc2-46be-9bbd-cac5c6e07fdd', 'cbcfc0b2-a823-4494-83fe-0902c4f62955', 'f5e3b5a9-ec3b-46a3-8afe-758653c44ada']","['polyglot-c-py__f2YnuPr', 'polyglot-c-py__P75fvD3', 'polyglot-c-py__ZW56kRb', 'polyglot-c-py__7ABLfAH', 'polyglot-c-py__2h69Gty']",0,"[514.70736, 570.089975, 900.039161, 900.144219, 438.353602]","[31.111279, 24.311702, 34.853574, 31.337492, 20.094416]",0.0,False,[] +gemini-2.5-flash,polyglot-rust-c,5,"['e254e52e-f245-4916-9fe4-c0fe15f0a6c1', '6358a638-898e-470f-8e83-71e5ed5da4e6', '183a74b1-e151-4dcb-a3eb-866e516d67a4', '21bd5aa3-4449-4842-860c-992f1226eebc', '36f36bc0-00f8-4f7c-9be2-e32bdf87c159']","['polyglot-rust-c__63oLtWd', 'polyglot-rust-c__wpX2xRU', 'polyglot-rust-c__f5JqJ9V', 'polyglot-rust-c__YsqHVMn', 'polyglot-rust-c__Zdih5gL']",0,"[900.939822, 207.448773, 936.539184, 905.820841, 905.47061]","[136.508478, 77.642753, 82.608462, 293.851148, 86.707079]",0.0,False,[] +gemini-2.5-flash,port-compressor,7,"['f932b575-ef40-4f3a-9133-6208bf3e0a24', '555b77eb-5c3d-4a4e-b4c9-ea03b9be4b2c', 
'088e3e03-89f2-40ec-9469-a86763ad9b58', '6838a0a6-0790-41da-9d9c-f68bd8f86637', 'c37d6317-c16e-43d4-842e-c6099c93f886', '38efde58-2307-4391-a382-738774025928', '419a276c-f7b8-49cb-8322-453920037ace']","['port-compressor__CC7YHQH', 'port-compressor__CzH7wcS', 'port-compressor__4RVSLKk', 'port-compressor__knKEXAH', 'port-compressor__GsSiuKA', 'port-compressor__PrU4tbS', 'port-compressor__os2RVJ4']",0,"[3632.902595, 3600.001834, 3600.001766, 3601.907017, 3601.932202, 3600.753661, 3600.002826]","[56.515079, 11.027719, 10.414741, 137.557463, 183.985849, 71.953327, 50.328363]",0.0,False,[] +gemini-2.5-flash,prove-plus-comm,5,"['5729b407-921a-484f-b68e-3b562602a700', '927ad9a2-0bea-4e6a-9029-d5d987079509', '55b022c0-cf29-431d-8fb3-cb8f4e791acd', '00dab5a2-1493-4eaa-ac3a-1753dc0afc40', '99adc89e-1af6-42ec-97ca-16e808ff80f5']","['prove-plus-comm__PWVX2ff', 'prove-plus-comm__LXFyvhP', 'prove-plus-comm__9Uc6ABk', 'prove-plus-comm__ZjjUBig', 'prove-plus-comm__8m5bqEP']",3,"[90.077706, 689.669266, 900.030109, 195.506131, 307.628228]","[14.037948, 10.09136, 35.801505, 59.856535, 22.222995]",0.6,True,"['5729b407-921a-484f-b68e-3b562602a700', '927ad9a2-0bea-4e6a-9029-d5d987079509', '99adc89e-1af6-42ec-97ca-16e808ff80f5']" +gemini-2.5-flash,pypi-server,5,"['3554d0d3-49c2-4c35-b1e8-b114edcccde7', '18e99116-2877-467f-beb1-35ef6e60aa20', '5ad21587-315d-4ece-894e-af0af09b3e77', 'f342cf95-6730-4acf-9f29-c4f95bbfe419', 'de9ae622-be1b-427e-8956-ec9391d0dff9']","['pypi-server__mDMzRWb', 'pypi-server__7HpXfQx', 'pypi-server__D2tmiry', 'pypi-server__DxtvRCC', 'pypi-server__xBpY35X']",0,"[460.690822, 659.650635, 376.132343, 902.599329, 122.966065]","[14.3, 36.842329, 72.097689, 29.425601, 47.253909]",0.0,False,[] +gemini-2.5-flash,pytorch-model-cli,5,"['baa9e22c-fdca-4106-8713-fd1d9f18055d', '5e80d518-20df-4262-bf89-ef61cfa5af80', '3fb3b8e3-1895-4e47-af1a-923e770ef1ff', 'db1d9636-215f-4977-930e-937bbc1f6a65', 'eedbf001-f093-4294-9075-39bd749df56e']","['pytorch-model-cli__zW6PvRi', 
'pytorch-model-cli__5yiLb3L', 'pytorch-model-cli__t9k49ZT', 'pytorch-model-cli__jvabJLh', 'pytorch-model-cli__B9xQiae']",0,"[137.913301, 887.785892, 207.06433, 107.20064, 159.941768]","[134.64795, 87.012576, 72.671134, 45.314952, 682.482624]",0.0,False,[] +gemini-2.5-flash,pytorch-model-recovery,5,"['fd44c5eb-2a25-4727-a1af-132a49b9d806', '9d8844cf-a603-4d51-a136-a18e75d3c67b', '3c4c26ed-5b4c-4d86-a976-10f834b4aaec', '9eedf61d-f886-4eb5-a63e-ab796ff7ebc0', 'bed85c80-9363-4acf-849f-5369fe2221d4']","['pytorch-model-recovery__ryio6Q3', 'pytorch-model-recovery__jTvAAEY', 'pytorch-model-recovery__hqh3Uoq', 'pytorch-model-recovery__HrtDmaj', 'pytorch-model-recovery__JD8kVpy']",1,"[910.551912, 900.007547, 640.553611, 900.953317, 903.391383]","[45.52182, 35.857597, 11.998866, 70.045287, 53.709808]",0.2,False,['3c4c26ed-5b4c-4d86-a976-10f834b4aaec'] +gemini-2.5-flash,qemu-alpine-ssh,5,"['f606f3a7-6266-4c9b-a396-2342709cf3dd', 'eec40351-5054-4e5d-97df-533199651f11', '13462627-1abe-46f7-b809-0fe5957216fb', 'aaeba6f7-a66d-4806-ac10-9a74ec798f11', '043a46ec-1d45-4bc7-b47e-950dddd336ec']","['qemu-alpine-ssh__D3KHV8p', 'qemu-alpine-ssh__cbbwNes', 'qemu-alpine-ssh__efCA6FD', 'qemu-alpine-ssh__X3Npc3D', 'qemu-alpine-ssh__LB7HFrk']",0,"[902.515037, 302.902164, 193.816308, 186.207167, 282.816872]","[9.931584, 25.123254, 6.077009, 9.629589, 5.001292]",0.0,False,[] +gemini-2.5-flash,qemu-startup,5,"['8dca7f3b-0e4f-4fef-b804-f6961fbd70a1', '66bd91ee-0855-4753-ad0f-ab6ae82509d0', '0220ba0e-a034-4a0e-b31e-0b5e446e45cc', '911113af-fb85-422f-b760-17ade4dea452', '3531b50a-5316-4e50-859c-1a99575eb5fb']","['qemu-startup__2A4Z3oF', 'qemu-startup__Npjtj32', 'qemu-startup__fhZ6C2R', 'qemu-startup__tSayziH', 'qemu-startup__JTGmHs8']",1,"[164.075666, 232.744757, 81.959598, 138.383353, 122.717458]","[13.410226, 20.697891, 36.074955, 3.065949, 18.511933]",0.2,False,['911113af-fb85-422f-b760-17ade4dea452'] +gemini-2.5-flash,regex-log,5,"['d9f7fabe-ee30-4f99-ad6f-6cb263593be2', 
'8bf3ccaf-39fc-4353-9c94-6d78f0b1b8fd', 'c4a902a0-d8a6-4df4-ab3c-2b61f2bea217', '3b215da4-7131-43c4-a290-8a206faa1157', 'b95d8ecb-e09b-413c-8ab1-b4d23f719401']","['regex-log__HM8fMw9', 'regex-log__x2krWnY', 'regex-log__dZqm3CM', 'regex-log__jEcHckU', 'regex-log__iRGjmvn']",4,"[59.872783, 150.324853, 115.098416, 119.21774, 232.693721]","[190.852631, 84.743626, 138.689703, 22.126005, 124.04175]",0.8,True,"['d9f7fabe-ee30-4f99-ad6f-6cb263593be2', 'c4a902a0-d8a6-4df4-ab3c-2b61f2bea217', '3b215da4-7131-43c4-a290-8a206faa1157', 'b95d8ecb-e09b-413c-8ab1-b4d23f719401']" +gemini-2.5-flash,reshard-c4-data,5,"['4244576d-586c-4f42-ac93-0c4ded3eead1', 'd4164b69-d8c1-442b-8f5a-60cee6e144d7', 'f569ab9b-964a-4a0d-a1e8-dd50f8327ff4', '8d8c0b1a-fe79-4119-8d90-d66b3fb99ba3', 'a67f954c-f839-4f6d-a842-6c7e0d819d11']","['reshard-c4-data__4ZVahiz', 'reshard-c4-data__S2dQEqc', 'reshard-c4-data__WHEMkSf', 'reshard-c4-data__htfmwtR', 'reshard-c4-data__4hL99se']",0,"[687.971142, 332.95525, 338.965268, 228.45223, 698.202098]","[152.836402, 23.883506, 23.87609, 102.197011, 100.484352]",0.0,False,[] +gemini-2.5-flash,reverse-engineering,5,"['308ba5ce-bf4f-44ed-ae89-4e40c60681f6', 'edb0b564-8acb-4163-9cf2-d6e1e808fb80', '405403de-3306-45bb-b4ee-d0b097e5f5b8', '56725b80-24a6-40b8-93a0-3a1a48cc0bb5', '188e7f6b-3b3e-48fb-a597-d848d8ec37a1']","['reverse-engineering__7TjET79', 'reverse-engineering__KWbkAz6', 'reverse-engineering__6H6r9Qy', 'reverse-engineering__VXRje2u', 'reverse-engineering__JbEnjyX']",0,"[1802.238321, 3721.991091, 727.750811, 1805.078216, 1805.156647]","[24.620833, 25.302125, 12.072253, 44.552771, 25.77396]",0.0,False,[] +gemini-2.5-flash,run-pdp11-code,5,"['71d1aa7d-b7b6-40ec-bc4d-1bc3524df738', 'd613cc38-4fa2-498a-9974-7a45106c6241', '9a6f79a5-5447-4a34-b6a6-5d8f9d20672d', '762cf99c-0f31-4a46-b12e-9d77cbab715b', 'a11648c9-06fc-4c98-b81f-04eb1403f241']","['run-pdp11-code__65LRtGF', 'run-pdp11-code__rMsgmep', 'run-pdp11-code__gULNFyG', 'run-pdp11-code__ZJmAsN9', 
'run-pdp11-code__3wgRM5F']",0,"[201.115824, 1009.787953, 848.854832, 346.061229, 199.612664]","[25.427637, 305.48037, 17.456331, 109.208612, 153.766583]",0.0,False,[] +gemini-2.5-flash,sanitize-git-repo,5,"['09166cd3-0460-46df-9232-8f16174a02ae', 'd84c23f3-dccb-4731-9ef9-9ced1bc7aae1', '4e72d6df-728e-4dc0-b20c-300dc694fb78', '8cad6437-ceed-4123-9a83-ec4f36f5e90f', '4aac4a6e-83bd-4671-89b1-466635dea80b']","['sanitize-git-repo__LuBBSA9', 'sanitize-git-repo__mQ6Ki7X', 'sanitize-git-repo__FPN6dUQ', 'sanitize-git-repo__QPngkon', 'sanitize-git-repo__UHDZCRs']",0,"[139.677482, 405.136463, 233.104675, 231.436895, 440.454082]","[41.162103, 33.775775, 148.692751, 30.989571, 262.594191]",0.0,False,[] +gemini-2.5-flash,schemelike-metacircular-eval,5,"['83707105-078e-45b3-ac52-7d32d7067d23', 'b63b9979-6887-48d0-89a0-04aad774acb9', 'cd1509f6-d2bd-4001-bb24-77d140667d78', '65b2f282-c1a8-4eba-ad74-8823dc4a2124', 'a38a3cae-6291-4236-9e2d-3d4383388866']","['schemelike-metacircular-eval__jT6nAhD', 'schemelike-metacircular-eval__HSpuLie', 'schemelike-metacircular-eval__4yDuqnF', 'schemelike-metacircular-eval__GXFXvAy', 'schemelike-metacircular-eval__UXGHkUb']",1,"[406.40546, 2411.472757, 2424.79551, 2407.326708, 2401.401767]","[98.782261, 45.887562, 58.763009, 27.646512, 28.029016]",0.2,False,['cd1509f6-d2bd-4001-bb24-77d140667d78'] +gemini-2.5-flash,sparql-university,5,"['e0d295a4-a48f-4d07-8014-fb0ba5dd65bb', '3284c740-abed-4169-ba43-543fd7b71ec3', '2e71fcaf-1f3f-437b-816d-23f5499b06e5', 'e538dc23-d30d-455f-a5d0-b9f6f064f353', '8ea03f3f-2acc-4739-be0e-f4d728b16fdd']","['sparql-university__p5FM8LR', 'sparql-university__E7qFjQH', 'sparql-university__MvQX4Y9', 'sparql-university__BzAAFjF', 'sparql-university__YA8MZ9n']",0,"[116.44352, 142.54112, 161.246405, 56.828186, 415.639648]","[52.624175, 35.883006, 47.792354, 27.875255, 88.507782]",0.0,False,[] +gemini-2.5-flash,sqlite-db-truncate,5,"['7c99ef96-5e2d-4153-b333-b974b4b93aa4', '3f7f6b20-2f2f-4152-83c3-86a307d0bb37', 
'0d0d1e25-9944-4d83-bfc5-0f1630e89e53', '416ac3f4-67b2-4ee6-b8e2-a7803e3f3d8f', '06699cc0-3120-4981-b472-ea34cfb93287']","['sqlite-db-truncate__76YrZvP', 'sqlite-db-truncate__2uUzrWf', 'sqlite-db-truncate__DQ9CRPe', 'sqlite-db-truncate__dEfiCJP', 'sqlite-db-truncate__y3MSSNT']",0,"[408.856252, 135.79395, 696.936867, 924.676223, 451.915077]","[123.156041, 34.928528, 53.877474, 51.399126, 24.202631]",0.0,False,[] +gemini-2.5-flash,sqlite-with-gcov,5,"['0787e74e-4c3c-43af-8e84-fa92fbbc8d38', '5cd64d2d-72fe-4d1f-88c7-2b8aa81ef600', 'e53aec63-bc73-4458-b831-2633666456bb', 'd23f9451-2e4a-40ed-a04c-7b567b8f2b80', '4a7d9634-bd75-4a1f-887d-f2e90f5769c7']","['sqlite-with-gcov__cPZvmfz', 'sqlite-with-gcov__UyN9APx', 'sqlite-with-gcov__MyPXBPm', 'sqlite-with-gcov__RLogXyw', 'sqlite-with-gcov__ATHwPag']",1,"[164.43347, 310.82023, 83.353124, 203.85763, 529.576716]","[64.175549, 148.349804, 45.534422, 45.648813, 61.916064]",0.2,False,['d23f9451-2e4a-40ed-a04c-7b567b8f2b80'] +gemini-2.5-flash,torch-tensor-parallelism,5,"['4eef11eb-05b9-45d2-84df-259ca47465ac', '5be71768-fa15-449d-b181-b3c3c0d61275', '420bd9ae-c0b3-4f5d-9d4c-a2eb37dedc52', '18ace2db-d5cf-4c41-b48e-075548cb28ab', '5d857a44-8392-437f-95e9-49a69092d33e']","['torch-tensor-parallelism__b5Knj9g', 'torch-tensor-parallelism__MeJPER4', 'torch-tensor-parallelism__7L7dXyT', 'torch-tensor-parallelism__3FEMTfj', 'torch-tensor-parallelism__nzHwh5Q']",0,"[367.071263, 783.1688, 106.718819, 67.658286, 902.001107]","[37.699936, 45.252802, 48.090065, 32.329489, 58.720375]",0.0,False,[] +gemini-2.5-flash,train-fasttext,5,"['8c1ffa77-d7a4-4fd5-911f-c02f395e16cc', '8c930c71-8f4d-4673-a961-0df31f2c83c0', 'de14ffb1-1ad4-4839-8200-6e70b0f2ea84', 'bd7138f8-a29d-4a6a-83aa-dd9c2f4137e1', '5de96757-f791-4e8e-bad9-4fd5e5dc3448']","['train-fasttext__MfhpVrU', 'train-fasttext__KjJnGEW', 'train-fasttext__JYtUrUT', 'train-fasttext__UJB6dVQ', 'train-fasttext__BfLBEXX']",0,"[1105.799926, 3602.355845, 1332.157481, 3602.629325, 
3643.970918]","[112.94885, 20.036513, 61.784417, 155.539048, 22.650909]",0.0,False,[] +gemini-2.5-flash,tune-mjcf,5,"['af3b68f1-396c-448a-9dda-8d24dd3648d7', 'd58a0742-3aac-4205-8809-bbd6a2dd6e0c', '4ec8a64f-1f87-4482-b9d3-044b2fb5b984', 'f652c17f-8af2-414e-8c2b-3b87c4c9fd96', '0540ddf3-3bee-4a30-be57-4e75b7dd4ce7']","['tune-mjcf__CJvBEXF', 'tune-mjcf__5RCxqv7', 'tune-mjcf__5V5t4Mi', 'tune-mjcf__jC38jwj', 'tune-mjcf__wCyvK8d']",3,"[338.635574, 579.517125, 471.552013, 608.146811, 967.592017]","[14.623899, 15.856917, 9.652158, 51.303426, 31.261997]",0.6,True,"['af3b68f1-396c-448a-9dda-8d24dd3648d7', '4ec8a64f-1f87-4482-b9d3-044b2fb5b984', 'f652c17f-8af2-414e-8c2b-3b87c4c9fd96']" +gemini-2.5-flash,video-processing,5,"['8dcf4c5e-4ff7-45d9-9cc3-2f210e7b6330', '7c8dd4b4-aab5-4f7d-bf94-573bb0883b57', '1965159e-f932-4aeb-8d8c-d239215dd483', '5b464a34-6c95-410f-bc96-f8724038d091', '93065444-5a6d-4e75-a99f-1399973871b0']","['video-processing__aaSRCx7', 'video-processing__9g7wfuS', 'video-processing__yWUjVWT', 'video-processing__FUBob2R', 'video-processing__6rtGrws']",0,"[144.336566, 211.800366, 163.565985, 227.169432, 130.618015]","[160.142337, 25.371176, 53.589249, 71.74622, 12.664187]",0.0,False,[] +gemini-2.5-flash,vulnerable-secret,5,"['bbe7d28a-4681-4069-a6e6-89afd10b8cdc', 'de09ea5d-cf82-492e-8481-85787f7476f5', '3943b20c-5e58-43e3-9076-ccef81806721', '00dde788-6d08-4d72-952f-c1605da7bc3b', '1f32547e-f906-4a8e-8c53-b29d9adae5dc']","['vulnerable-secret__pKRjC9z', 'vulnerable-secret__v6iiP7B', 'vulnerable-secret__vCTYs8C', 'vulnerable-secret__4a3MiR5', 'vulnerable-secret__WuLoE2m']",0,"[907.595431, 921.406055, 900.256038, 907.901601, 906.549594]","[10.485163, 80.009727, 67.625971, 23.981547, 17.290419]",0.0,False,[] +gemini-2.5-flash,wasm-pipeline,5,"['0da3030f-abda-4a61-a575-ff94f85b833a', '46a5d097-aa06-4f7a-83af-ffbff2c96450', 'ca3764f9-cfd5-424e-bffe-0bb6cc8809e1', '845da8d8-487b-4667-870b-e9582cae3407', 
'40cb4c1f-9bf1-40a5-bd54-c385e8b283a0']","['wasm-pipeline__KfhS4jX', 'wasm-pipeline__VsZYkV3', 'wasm-pipeline__3qwt2Fx', 'wasm-pipeline__NuQGUC9', 'wasm-pipeline__MgYCnq4']",2,"[883.290468, 111.127443, 386.865551, 900.037555, 682.407067]","[12.285576, 2.071831, 45.582099, 17.558079, 14.694503]",0.4,False,"['ca3764f9-cfd5-424e-bffe-0bb6cc8809e1', '40cb4c1f-9bf1-40a5-bd54-c385e8b283a0']" +gemini-2.5-flash,winning-avg-corewars,5,"['f3a9382a-a286-4120-8504-083298757995', '24fe1f4f-ac82-4a49-997c-b9e0d0279746', 'b16bec4f-7de1-4ee8-a6a0-1b6fd638b1dc', 'b6f70425-b2ed-4016-a90b-cc22140af471', 'ceab9c91-1690-4a62-8f30-334eb48874d0']","['winning-avg-corewars__4cPKG8Y', 'winning-avg-corewars__kdBXksd', 'winning-avg-corewars__nqiqFmt', 'winning-avg-corewars__cKQ9PZz', 'winning-avg-corewars__s4mFM24']",0,"[3639.669892, 3625.773378, 952.083953, 3600.201056, 2630.333253]","[172.397374, 4.854323, 31.643622, 64.323011, 54.804372]",0.0,False,[] +gemini-2.5-flash,write-compressor,5,"['529149a0-446d-4b3f-a6c9-fb67935eb125', 'caa90f1a-6279-4eae-bb47-a68dfac3e0ac', 'f83bb266-d229-493b-af2f-7706a9625baa', 'fa8a7c63-a42f-4903-95f3-8b0c4dd7755a', '9c5e1511-769a-46ef-bdf9-e99f40d6af62']","['write-compressor__vFpEAzQ', 'write-compressor__aebZWvx', 'write-compressor__V3iteav', 'write-compressor__sExxkqi', 'write-compressor__e2sU3RY']",0,"[900.860191, 917.835988, 900.214951, 907.29728, 825.210902]","[103.840087, 28.359317, 46.657638, 26.268682, 45.630133]",0.0,False,[] +gemini-2.5-pro,adaptive-rejection-sampler,5,"['e69573f8-1005-43c1-97a6-de53ad690f46', 'f002ec63-b254-4a29-91e2-ca2c8cc3ab11', 'cebc8fed-ce0f-4dd8-aaa9-7f920a8da2b9', 'f2829ebc-d8a0-4a5b-8eb7-46e0bf85a454', '1cba150c-69a1-416e-b05a-0bf94c6090a3']","['adaptive-rejection-sampler__e8jmkNE', 'adaptive-rejection-sampler__suWp9Bf', 'adaptive-rejection-sampler__fQNDkHh', 'adaptive-rejection-sampler__fJmoviX', 'adaptive-rejection-sampler__RJsQRiz']",2,"[526.494362, 900.03646, 906.747334, 917.26487, 774.267194]","[64.64703, 138.933384, 
24.112169, 38.067705, 52.348089]",0.4,False,"['cebc8fed-ce0f-4dd8-aaa9-7f920a8da2b9', 'f2829ebc-d8a0-4a5b-8eb7-46e0bf85a454']" +gemini-2.5-pro,bn-fit-modify,5,"['cad02dd5-5fbb-4a25-81b3-d19768f5577f', '2aed27f3-8026-448e-94dd-e21e7fbd3957', 'c29606d9-d129-4004-8c1c-fed9af885f20', '71ba4fdb-231b-4d62-865a-07d941082ef1', '007a88ca-44bb-421a-bb4a-039c5eb8cd68']","['bn-fit-modify__iWSD23A', 'bn-fit-modify__h2yRfJd', 'bn-fit-modify__yF5UDfa', 'bn-fit-modify__8i2nY2e', 'bn-fit-modify__TTwYVrw']",0,"[3181.10882, 1886.47887, 2057.063295, 1141.810501, 3511.16303]","[47.83962, 65.308644, 45.361749, 210.254512, 13.740454]",0.0,False,[] +gemini-2.5-pro,break-filter-js-from-html,5,"['2f042871-257d-4970-afd8-a566d86676a0', '8343a0c3-2e37-4db1-8fcf-38e5d8ec53c0', '71b785c4-06af-44f2-9150-00a8a6e10302', '8027bb23-315d-40b5-99c0-4a04fbd15e2b', '73adb208-b1e7-4021-b87a-e97fb65d926b']","['break-filter-js-from-html__CvoMqgV', 'break-filter-js-from-html__GYPgkxy', 'break-filter-js-from-html__HofcwGP', 'break-filter-js-from-html__dtNpjhh', 'break-filter-js-from-html__Z4Qcubu']",1,"[977.348113, 346.544619, 182.090463, 1203.268636, 1206.644112]","[67.877776, 13.121558, 55.903134, 80.773145, 221.329925]",0.2,False,['2f042871-257d-4970-afd8-a566d86676a0'] +gemini-2.5-pro,build-cython-ext,5,"['f6267b9b-acac-4681-bc23-6ff71e6b2205', '1a4a0c7e-5956-4477-ae6a-ae45a1b40979', '8930e099-3045-4cb6-b040-0a8b467e92fb', 'ea493867-f535-4e01-bf8c-9778da51c90d', 'aae236ea-eb56-4b19-81e3-659dbdf2e053']","['build-cython-ext__mBnVNAL', 'build-cython-ext__s6cQHqq', 'build-cython-ext__VfnvGMa', 'build-cython-ext__VzZLCA7', 'build-cython-ext__dnpPiUv']",0,"[907.970203, 789.476067, 596.690821, 930.140354, 807.617293]","[162.349234, 163.54672, 8.222148, 55.710573, 104.944242]",0.0,False,[] +gemini-2.5-pro,build-initramfs-qemu,5,"['8b737da3-a70e-49e7-a047-d8094973eec4', 'f51d2b46-f004-41e9-8e58-d9bb4c8e4b6e', '67ca3e36-deeb-43d0-b3b8-a4642d191ef8', '9e6df700-6705-4b41-b1cc-467fb1074b63', 
'd6b43375-583f-41ed-be41-3c2ab2f4c6f5']","['build-initramfs-qemu__hha3P4n', 'build-initramfs-qemu__kfiktLa', 'build-initramfs-qemu__xVneThU', 'build-initramfs-qemu__5nYi6NW', 'build-initramfs-qemu__qvQC6sU']",0,"[615.238579, 900.00074, 900.644562, 125.64759, 595.349904]","[82.370677, 11.223808, 79.42889, 13.582328, 32.450963]",0.0,False,[] +gemini-2.5-pro,build-pmars,5,"['d6667947-704b-4737-b0d3-9ea5e623a4b3', '7bb4f3b9-9ed2-4419-9f81-964eb277c6af', '1b77a840-a6f8-4e67-a279-8cf7823604c1', 'e617cf75-8156-4ae3-bb0d-683be8e2e998', 'cf78898e-2bfa-4a22-a682-d9f05c9fa5b9']","['build-pmars__CjCXaqe', 'build-pmars__VSuotju', 'build-pmars__RQcQfK2', 'build-pmars__ZbtXAJm', 'build-pmars__byNx8pF']",5,"[224.835783, 425.277691, 454.624491, 630.295473, 387.223245]","[4.609231, 4.662703, 6.373235, 35.541883, 36.62079]",1.0,True,"['d6667947-704b-4737-b0d3-9ea5e623a4b3', '7bb4f3b9-9ed2-4419-9f81-964eb277c6af', '1b77a840-a6f8-4e67-a279-8cf7823604c1', 'e617cf75-8156-4ae3-bb0d-683be8e2e998', 'cf78898e-2bfa-4a22-a682-d9f05c9fa5b9']" +gemini-2.5-pro,build-pov-ray,5,"['0140c865-fe86-4646-a5dd-27a9ff1abfca', '4988957b-82fd-4bd5-979e-309eefc512b4', '2303fae9-8cbf-4cb4-8140-a50cbbb4e319', '17d25f0b-4f3a-4708-8f4d-65e7b6572e9d', '4856feea-0627-412f-862b-7dc26e068df6']","['build-pov-ray__dTH4oSt', 'build-pov-ray__7KYJyhZ', 'build-pov-ray__DYpWJiy', 'build-pov-ray__MAp4pFJ', 'build-pov-ray__aKCmUCx']",5,"[571.150078, 1672.216476, 3241.614184, 1015.919214, 2019.230885]","[43.377666, 32.904326, 56.185703, 41.545895, 156.147907]",1.0,True,"['0140c865-fe86-4646-a5dd-27a9ff1abfca', '4988957b-82fd-4bd5-979e-309eefc512b4', '2303fae9-8cbf-4cb4-8140-a50cbbb4e319', '17d25f0b-4f3a-4708-8f4d-65e7b6572e9d', '4856feea-0627-412f-862b-7dc26e068df6']" +gemini-2.5-pro,cancel-async-tasks,5,"['0e937de3-87c8-4ecc-a861-41a9c8ebccef', '01b0549b-ac54-41f2-bc1d-9c4b9dbb6d60', '70120133-6e23-4b6f-9b31-77872a76daf9', '4f5b7a2a-8051-4fcd-bb1d-ba1bd243b33c', 
'319b341e-2566-4d2f-9691-c36d6122e1b4']","['cancel-async-tasks__CVnRWZT', 'cancel-async-tasks__KWPEYgv', 'cancel-async-tasks__krwGnGh', 'cancel-async-tasks__AeygyZr', 'cancel-async-tasks__ZohvFkM']",0,"[91.541084, 170.05352, 391.023943, 72.256043, 91.491076]","[59.674994, 45.149418, 315.695045, 95.168765, 100.804183]",0.0,False,[] +gemini-2.5-pro,chess-best-move,5,"['03676562-8dfd-41c2-813c-068d914ec293', '9b66bc7e-e7e5-4d0f-8331-0ce670317fc3', '05aa6231-d140-4980-9f9a-48de61adf1c7', '476eafbb-d551-42c7-8543-c1d791b4b995', '500ec7c6-b44d-432c-a63e-e8ceea9e9273']","['chess-best-move__cmXKDWF', 'chess-best-move__dnem77e', 'chess-best-move__T6kJEUq', 'chess-best-move__ontFAzf', 'chess-best-move__yGrptys']",0,"[901.276443, 906.223259, 658.742946, 446.379789, 920.806316]","[9.420855, 202.252495, 13.941719, 12.503394, 48.495549]",0.0,False,[] +gemini-2.5-pro,circuit-fibsqrt,5,"['a28c0ba5-3b17-4d8c-841d-5e2894c05fe0', 'e704bb7d-9eba-4933-acd0-dfe4bea28464', 'c068bfa3-5ca2-409c-999a-0d811c6ac76a', 'afa51c2f-fa37-46ce-9d2f-6f132d35cf87', '5d203aaf-d47f-4e4f-bb7b-8d466266e66f']","['circuit-fibsqrt__TuT7Cvr', 'circuit-fibsqrt__FhFwdZf', 'circuit-fibsqrt__zBhAUwM', 'circuit-fibsqrt__ZubncBE', 'circuit-fibsqrt__JVjMHBk']",0,"[3607.193816, 3600.717217, 1048.719121, 747.144993, 266.591979]","[1415.571523, 38.923515, 48.704798, 17.593951, 37.189178]",0.0,False,[] +gemini-2.5-pro,cobol-modernization,5,"['85005041-a156-4014-a23c-38a277c4655b', '35726627-9bc4-45a5-8853-9782bb718b99', '48fc6838-ce69-4495-bff7-21cf134d6c6a', '70e3ed36-c854-4e7a-bb43-90fd8dc04dc5', '043d445e-c060-4c82-8e93-c61ef5faa29d']","['cobol-modernization__XqWgAuK', 'cobol-modernization__AuHwBYC', 'cobol-modernization__b3Gyc6M', 'cobol-modernization__U9YjzKN', 'cobol-modernization__ofBTP69']",5,"[316.468453, 343.081688, 420.1549, 913.022822, 376.961468]","[53.69416, 63.35875, 23.622137, 226.98697, 36.434139]",1.0,True,"['85005041-a156-4014-a23c-38a277c4655b', '35726627-9bc4-45a5-8853-9782bb718b99', 
'48fc6838-ce69-4495-bff7-21cf134d6c6a', '70e3ed36-c854-4e7a-bb43-90fd8dc04dc5', '043d445e-c060-4c82-8e93-c61ef5faa29d']" +gemini-2.5-pro,code-from-image,5,"['7fdac6dc-eb54-4b8f-bf04-393ca58b6afd', '7ec1dc23-8b59-4aec-b92c-399288c85d61', '4ae2c74c-06d1-463d-9b19-bf60401c71fa', '438136c8-3469-43f7-8342-8d2d3fbadce4', '6e48a98e-8902-45dc-8006-d0f97c9d8fd8']","['code-from-image__YCsV2or', 'code-from-image__Wu3VbiH', 'code-from-image__QSsyVQM', 'code-from-image__3QGHXcS', 'code-from-image__Y2KTjpE']",5,"[196.741165, 176.713528, 279.766914, 194.843998, 185.239353]","[47.432147, 38.58845, 23.91348, 20.921581, 73.874023]",1.0,True,"['7fdac6dc-eb54-4b8f-bf04-393ca58b6afd', '7ec1dc23-8b59-4aec-b92c-399288c85d61', '4ae2c74c-06d1-463d-9b19-bf60401c71fa', '438136c8-3469-43f7-8342-8d2d3fbadce4', '6e48a98e-8902-45dc-8006-d0f97c9d8fd8']" +gemini-2.5-pro,configure-git-webserver,5,"['59c2a27d-ff13-426b-b7bd-659205ca9654', 'e06368eb-39b1-409d-a8e0-2eb9a72a6e02', '9efe4e45-ceec-49f6-8708-d011da533647', '664b1a7c-a3f9-44b7-b27f-53010ecd4d04', '8207d8eb-e02b-407a-9c27-68fb53223489']","['configure-git-webserver__SnA7Wa4', 'configure-git-webserver__589LuMG', 'configure-git-webserver__AVbCnrD', 'configure-git-webserver__k3rLofL', 'configure-git-webserver__N7TgdBV']",0,"[308.296703, 394.346769, 273.775654, 794.839694, 228.676898]","[62.939998, 68.161627, 117.224727, 42.815367, 59.062088]",0.0,False,[] +gemini-2.5-pro,constraints-scheduling,5,"['be166240-44c0-47a6-9802-2086de981cc8', '764759d3-7ece-48fe-8d61-3079e4adfb4d', '1629cd15-cab0-4e66-ac31-b62e391a69e0', 'b94ba249-e720-483c-b322-88a76474fb89', 'ffcd079d-4317-47bd-858e-42585a99765a']","['constraints-scheduling__qXTUgaX', 'constraints-scheduling__59Yubfn', 'constraints-scheduling__GnoDw2A', 'constraints-scheduling__FfkDgmP', 'constraints-scheduling__hYR9QH4']",5,"[497.636497, 380.134874, 476.403029, 299.170936, 524.276474]","[45.977021, 66.287766, 72.673223, 13.64652, 179.143596]",1.0,True,"['be166240-44c0-47a6-9802-2086de981cc8', 
'764759d3-7ece-48fe-8d61-3079e4adfb4d', '1629cd15-cab0-4e66-ac31-b62e391a69e0', 'b94ba249-e720-483c-b322-88a76474fb89', 'ffcd079d-4317-47bd-858e-42585a99765a']" +gemini-2.5-pro,count-dataset-tokens,5,"['3c9a3346-5d8d-46dc-a9a5-c38e1c76844f', '448acebb-68b4-4032-b948-f7c071e56d09', '58f55fcb-1a6f-4e3e-b988-68bc4fbb8b54', 'e83d15c2-7116-4d80-b00a-1b38b98b4200', '549c552d-4def-4ae6-a614-5f7d5988febb']","['count-dataset-tokens__gwkufwY', 'count-dataset-tokens__cSHoF6q', 'count-dataset-tokens__mcnrkob', 'count-dataset-tokens__rLzQarf', 'count-dataset-tokens__5TYKQE5']",0,"[905.098183, 900.227218, 910.470714, 904.549244, 902.980624]","[260.798769, 56.212727, 132.879295, 62.73524, 22.879226]",0.0,False,[] +gemini-2.5-pro,crack-7z-hash,5,"['4998705f-dfc2-4d43-9bca-1d2b5bd7d83d', 'a6e6f102-fd32-4f81-b389-2786ed6a5c07', '6d82c420-6c4b-4a56-9bee-b5848d2d647e', '4a54a613-a835-4723-84ea-dc8e3ee54a66', '4441684a-f656-4525-b1f5-a1838a6dca24']","['crack-7z-hash__a4mrSvK', 'crack-7z-hash__DLHgxhM', 'crack-7z-hash__xHyEx3a', 'crack-7z-hash__59s8im7', 'crack-7z-hash__FqoNwWi']",4,"[327.452375, 432.637942, 723.035224, 904.810536, 328.915003]","[11.12642, 46.054827, 68.514557, 18.16874, 17.074319]",0.8,True,"['4998705f-dfc2-4d43-9bca-1d2b5bd7d83d', 'a6e6f102-fd32-4f81-b389-2786ed6a5c07', '6d82c420-6c4b-4a56-9bee-b5848d2d647e', '4441684a-f656-4525-b1f5-a1838a6dca24']" +gemini-2.5-pro,db-wal-recovery,5,"['31abb7ed-a7dd-4710-ae5e-767265e5c6e9', '365a54ec-e6b1-4c0d-811b-bdc50aabc9da', '6e6d6d57-1538-4828-a31e-9f5deec24cd9', '03e402fe-73c6-4072-9199-8e51be1bf986', '58cc0734-7551-4fbc-8ef3-acb1910588df']","['db-wal-recovery__Hma5Tyj', 'db-wal-recovery__a5o4Pkv', 'db-wal-recovery__nz4DT4k', 'db-wal-recovery__jJFwMyo', 'db-wal-recovery__ByoYUKg']",0,"[462.198917, 906.509691, 903.184844, 902.236578, 900.031961]","[14.164981, 98.368563, 56.09972, 15.125195, 202.184359]",0.0,False,[] +gemini-2.5-pro,distribution-search,5,"['abb5fa06-95cd-4911-b085-7ab0e2d7520c', 
'09378996-e8f7-4e81-9a54-2b257883276f', '8ffd70e1-c0a6-4b76-adf3-92848f6c5f9b', '57191ccb-e58b-4421-a92e-49d6b0220b21', '0335783f-744b-44be-b8ad-9a0ff983e200']","['distribution-search__5HJcUT6', 'distribution-search__NTnxsrX', 'distribution-search__G8kdRCb', 'distribution-search__8BpsHeX', 'distribution-search__nMpovfX']",3,"[748.86701, 1231.011082, 180.449652, 641.21183, 356.706715]","[27.462067, 154.725048, 24.438852, 29.90952, 36.558273]",0.6,True,"['abb5fa06-95cd-4911-b085-7ab0e2d7520c', '09378996-e8f7-4e81-9a54-2b257883276f', '57191ccb-e58b-4421-a92e-49d6b0220b21']" +gemini-2.5-pro,dna-assembly,5,"['b09962d1-db36-4b8d-94a9-ac2032b0f516', 'f6e473ff-febe-4b9d-bce1-5289638617a9', '3f84f3d4-9993-4a5a-8b2a-fa35fb20b030', '25759d41-77bb-486f-abe6-672138e141d6', '86465dc4-c277-474b-abad-8aecd61bc1c8']","['dna-assembly__NvBmoFK', 'dna-assembly__89Yf9uv', 'dna-assembly__ajGzxyj', 'dna-assembly__FbdDnqu', 'dna-assembly__s7pQZum']",0,"[451.541357, 749.84186, 269.538427, 657.69496, 434.661754]","[24.910604, 19.952894, 180.564112, 82.984113, 64.063743]",0.0,False,[] +gemini-2.5-pro,dna-insert,5,"['67e5c801-6eae-491d-b3bb-74a6ed2e3114', '1b2f8bc8-778e-4965-b0f7-fd8865be8a0d', '7003de2c-f21a-47a1-8f84-e7328d41e32f', '83d5a3ac-f0a9-477f-8ee7-f4d2d74a0c4a', 'cdf58378-9ea2-4597-960e-503d786bcdc4']","['dna-insert__xvBhKc2', 'dna-insert__EmyMrVG', 'dna-insert__aqExgLA', 'dna-insert__dSxTjrP', 'dna-insert__HjWCiUc']",0,"[364.122258, 368.076838, 377.755718, 290.502575, 374.329582]","[28.019612, 15.558229, 46.804777, 70.095505, 284.051867]",0.0,False,[] +gemini-2.5-pro,extract-elf,5,"['1a30ce31-6524-4788-b1d4-39553d21138a', '96ccc7b3-5ebd-4602-85f6-930b024e1a7b', 'ec1afa10-40ef-4ae0-a918-f4dc7680160e', '6adae00a-f6b3-4370-890b-aaf8dc8758c3', 'c160dcdd-00fc-4e0f-86f4-515c46ec29f3']","['extract-elf__XUJVPBA', 'extract-elf__Km9ZTdP', 'extract-elf__CveMcbU', 'extract-elf__XayC3mE', 'extract-elf__WWx6QFr']",0,"[281.684665, 900.276668, 825.739477, 245.914217, 356.41755]","[160.687086, 
13.628371, 55.350327, 23.660235, 109.056229]",0.0,False,[] +gemini-2.5-pro,feal-differential-cryptanalysis,5,"['4cfcb1c8-ecc2-4140-a97a-39357b396022', '2604cc6e-eaaa-4f21-856b-452c53472eb6', '5a9b04fb-eba8-4f4b-a193-2c333963598c', '622b84b3-7a4e-4b5e-8804-c81199a26874', 'f5973661-ad82-452f-a89e-0430ac60ffd7']","['feal-differential-cryptanalysis__GG6rWPm', 'feal-differential-cryptanalysis__b3VPBi7', 'feal-differential-cryptanalysis__e7iRbmp', 'feal-differential-cryptanalysis__jRifVmM', 'feal-differential-cryptanalysis__PcqmSdh']",3,"[1157.066908, 669.841014, 496.416113, 751.377285, 477.303108]","[35.65185, 118.736237, 23.025945, 119.566557, 212.072632]",0.6,True,"['4cfcb1c8-ecc2-4140-a97a-39357b396022', '2604cc6e-eaaa-4f21-856b-452c53472eb6', '5a9b04fb-eba8-4f4b-a193-2c333963598c']" +gemini-2.5-pro,feal-linear-cryptanalysis,5,"['90c3c2ca-b2f1-4700-b045-a8c89364cddd', 'c378e4f4-6428-436f-a9c7-a5a64f70b4b4', '0bd10e96-f7cb-4d56-b1e7-6453483922a1', 'b6680e56-4e5d-4989-a83e-94870532d35e', '4345f2dd-9537-4ff5-a854-f2482b6b02e8']","['feal-linear-cryptanalysis__Z6SL62q', 'feal-linear-cryptanalysis__s7nhHew', 'feal-linear-cryptanalysis__afPTP6d', 'feal-linear-cryptanalysis__MprN2dL', 'feal-linear-cryptanalysis__RbRzFYt']",0,"[1801.078126, 1408.283413, 1802.292989, 1810.216043, 1819.861515]","[21.217866, 117.755877, 314.917732, 29.183672, 102.957782]",0.0,False,[] +gemini-2.5-pro,filter-js-from-html,5,"['87463878-f622-4fa2-9a55-ee58363edc97', '7587ebcd-3cab-45c3-88b5-5b5000c5266b', 'ff9f5194-ac5f-46b7-bec8-4931295074d3', 'd5a94c8b-374e-4719-96ce-8a6c3677d366', '671d6d8a-184a-4e08-8294-a0394813d0a3']","['filter-js-from-html__EsxAj5n', 'filter-js-from-html__ZnascZk', 'filter-js-from-html__8B9Sc2R', 'filter-js-from-html__bTWeKJy', 'filter-js-from-html__7u9hGqB']",0,"[95.371836, 172.377752, 678.564274, 135.518955, 452.584749]","[67.248202, 57.977189, 43.773345, 37.276222, 33.314077]",0.0,False,[] 
+gemini-2.5-pro,financial-document-processor,5,"['9b253c0b-3f1e-43ce-ae61-83b9ce41065d', 'a76c1ffd-65f5-4a2a-827d-42e0cc3625d9', '3e244d06-820d-4147-836e-d007dac9cc59', '01b691ca-923b-411d-9559-ab2dc1c12dea', '34fd79dc-26d3-4791-9b3a-a187d8d5dfe9']","['financial-document-processor__fprk6yy', 'financial-document-processor__6kY5iN7', 'financial-document-processor__3jWW4ER', 'financial-document-processor__NLHXuWb', 'financial-document-processor__uPrDUqh']",0,"[546.588775, 557.748855, 531.094791, 463.530648, 1206.472336]","[30.671903, 102.228523, 99.923523, 22.110132, 28.78583]",0.0,False,[] +gemini-2.5-pro,fix-code-vulnerability,5,"['2d5a8aa2-5da4-481f-8904-73106e06fd73', 'e7beaccf-489a-4aab-b96f-2bc53f170894', 'eb3ee69a-a2c9-4619-a2db-a0d92cc6c8a0', 'a8eeb70d-baf1-4ee5-9d4c-42cabd86063b', '76320ab6-3367-459c-9433-ebdf7a882529']","['fix-code-vulnerability__qvoPopA', 'fix-code-vulnerability__GcBNmNt', 'fix-code-vulnerability__jTeJfiP', 'fix-code-vulnerability__kvB78Vn', 'fix-code-vulnerability__US4Cc5V']",1,"[530.373659, 790.776486, 900.008762, 966.169399, 574.522182]","[36.95066, 15.698741, 3.877089, 61.539103, 39.055953]",0.2,False,['2d5a8aa2-5da4-481f-8904-73106e06fd73'] +gemini-2.5-pro,fix-git,5,"['d4f5757f-9a4d-46a9-ba71-47ad00e5fd46', '0295b1eb-f9b3-473f-b936-a8bf02c59d81', '9dbca2e3-c4f5-48ff-9ed4-d824c252c2c1', '379d7a79-ec80-46da-9518-1cae88098209', '8d0298d5-b7ea-4f08-9d45-d5aedae90dff']","['fix-git__EeVbABu', 'fix-git__F8CMNhh', 'fix-git__D4TzYM5', 'fix-git__ehhfdKf', 'fix-git__HnhkwP2']",5,"[143.464295, 143.803245, 146.54887, 141.68754, 142.166775]","[19.46231, 13.358938, 30.610556, 48.35522, 59.875217]",1.0,True,"['d4f5757f-9a4d-46a9-ba71-47ad00e5fd46', '0295b1eb-f9b3-473f-b936-a8bf02c59d81', '9dbca2e3-c4f5-48ff-9ed4-d824c252c2c1', '379d7a79-ec80-46da-9518-1cae88098209', '8d0298d5-b7ea-4f08-9d45-d5aedae90dff']" +gemini-2.5-pro,fix-ocaml-gc,5,"['54242fbe-3b51-49f3-ae49-4c54c815aa61', '3cd9e1da-2db1-4267-b425-db8c50092902', 
'192b6cc7-cb55-4ccf-974e-c67f8057cad7', '4d4a065e-bf91-4603-8a7d-744900717927', '0c88fe40-f7c2-4887-8365-e1d1e04dc572']","['fix-ocaml-gc__ftVK7nW', 'fix-ocaml-gc__vnL7pQY', 'fix-ocaml-gc__F2Ycckw', 'fix-ocaml-gc__uAYZEFA', 'fix-ocaml-gc__ACXiPWo']",1,"[3600.464048, 3600.095149, 3604.805525, 3600.001172, 1269.116548]","[25.992309, 81.803245, 60.028567, 45.264616, 32.745783]",0.2,False,['0c88fe40-f7c2-4887-8365-e1d1e04dc572'] +gemini-2.5-pro,form-filling,5,"['9b89f08b-6f11-4cd0-aa72-46d9326a3baa', 'f4ab7d8d-4c1f-439c-95bb-fb3bdfea7197', '5b597738-727e-4aa6-9030-1cfb8f8b2ac2', '73d81b14-c1fa-447a-9639-7347d2656249', 'edd375ed-ded0-4f7a-abdc-4974e03c75f5']","['form-filling__MBuU6RT', 'form-filling__d7dxBib', 'form-filling__9th4iio', 'form-filling__GXpcQJS', 'form-filling__F28nmdQ']",1,"[461.405179, 215.428702, 223.876052, 298.99749, 248.176906]","[35.855609, 4.867748, 9.350037, 17.547103, 4.158507]",0.2,False,['5b597738-727e-4aa6-9030-1cfb8f8b2ac2'] +gemini-2.5-pro,git-leak-recovery,5,"['39990a66-0bef-416f-ba42-7e832383a32a', '8c0ff9ee-3307-415d-ae8a-bfc0e59ec372', '9175c86e-8e5a-43f4-90e2-802bbae7f0a5', 'eede16e8-4c38-492c-80f5-4aeb09f8ebae', '5a1e5753-f730-46f3-bbff-8b85f290cddc']","['git-leak-recovery__KAfYUEc', 'git-leak-recovery__QbkMoGD', 'git-leak-recovery__F5rNbVz', 'git-leak-recovery__sPRCGXA', 'git-leak-recovery__8799sHo']",5,"[161.396977, 247.138438, 179.399228, 143.796337, 101.012342]","[40.250902, 90.769659, 29.520303, 60.536858, 180.877892]",1.0,True,"['39990a66-0bef-416f-ba42-7e832383a32a', '8c0ff9ee-3307-415d-ae8a-bfc0e59ec372', '9175c86e-8e5a-43f4-90e2-802bbae7f0a5', 'eede16e8-4c38-492c-80f5-4aeb09f8ebae', '5a1e5753-f730-46f3-bbff-8b85f290cddc']" +gemini-2.5-pro,gpt2-codegolf,5,"['ce45e7da-75b8-479a-905b-d50c058073b7', 'bd86c98c-2dc2-4204-ab57-36ea899eb2e2', '61cef84b-cbbd-4dc2-a0f4-9bb24abb4beb', '9bd77213-0756-4acc-85fa-af067cfada7a', 'df3c0244-2d9d-4197-a58d-aae134fb9012']","['gpt2-codegolf__3mux4F8', 'gpt2-codegolf__vYKjcRd', 
'gpt2-codegolf__gpfb7Tt', 'gpt2-codegolf__RfzmGg8', 'gpt2-codegolf__s8JkJCn']",0,"[925.61234, 578.831026, 697.547094, 900.01824, 876.970709]","[53.513499, 317.705891, 23.844084, 186.067957, 88.506633]",0.0,False,[] +gemini-2.5-pro,hf-model-inference,5,"['0808b141-e692-4b10-9099-1a0756b10bc7', '7736d7f7-7c2c-4cf3-93ae-69259fcbd531', '8e34bbc2-6a7f-4a81-8622-3a503dc99f9b', '2db5ef23-ba6a-4401-bad6-0c2633e8ba49', 'dc8ff2d4-6f90-481a-870c-b4a6879ef177']","['hf-model-inference__6B5FVy9', 'hf-model-inference__hGNWyxc', 'hf-model-inference__S7pw5bV', 'hf-model-inference__crkgniE', 'hf-model-inference__soNJS3x']",4,"[385.675959, 409.329734, 162.783819, 900.775896, 298.582968]","[106.885602, 19.035863, 63.282812, 24.622973, 125.276207]",0.8,True,"['0808b141-e692-4b10-9099-1a0756b10bc7', '8e34bbc2-6a7f-4a81-8622-3a503dc99f9b', '2db5ef23-ba6a-4401-bad6-0c2633e8ba49', 'dc8ff2d4-6f90-481a-870c-b4a6879ef177']" +gemini-2.5-pro,install-klee-minimal,5,"['7d5be542-d466-448e-a3ff-90dcf5b16d34', '80dddf7a-6565-427e-916e-944b3f47539b', '94f6ca4f-80c7-43ae-a8a1-efe58bc63540', '6b3784ec-ec17-482c-92d8-89a5624f7112', '11e41d76-4685-452a-b9fb-83ff05e2516d']","['install-klee-minimal__Y4Ue6Ts', 'install-klee-minimal__56ED2ND', 'install-klee-minimal__pUhyGwH', 'install-klee-minimal__dM7RnB7', 'install-klee-minimal__PDajzqC']",0,"[900.284624, 900.390169, 900.181155, 901.982227, 902.006206]","[37.095102, 111.308001, 97.706537, 113.685406, 55.654758]",0.0,False,[] +gemini-2.5-pro,install-windows-3.11,5,"['30ccdbd1-60e5-449c-94ac-84642f8b8131', '588ead5f-6057-4782-9ef9-75c05f1c98bf', '5c7e79ec-3666-4fdc-8728-a8deed40d238', 'bf7cee47-a4d6-4b73-9a3b-fb9c6a3d64f7', '07c17916-c56d-420a-9f94-6d10577181e0']","['install-windows-3.11__zeTsQzV', 'install-windows-3.11__oHMSS8R', 'install-windows-3.11__fAzsnJF', 'install-windows-3.11__sbbtfZt', 'install-windows-3.11__CnyA6ap']",0,"[1216.939536, 902.519851, 530.952951, 3644.88457, 246.344728]","[131.003657, 29.718534, 40.487336, 46.133225, 
26.119372]",0.0,False,[] +gemini-2.5-pro,large-scale-text-editing,5,"['1a8e28c9-d2e7-41aa-af05-1fe5c1c4b4f1', '493278cb-7d2b-41d7-89a3-6bbcc3368509', '11934b09-7fb4-4fb4-97d9-ded874403ba5', 'a2443d3a-6a5f-47ab-bfd9-871ed26d94f5', 'e3331a99-d920-4031-b3ba-45ff5e1a25a6']","['large-scale-text-editing__9iqBPbu', 'large-scale-text-editing__TCsHZ6B', 'large-scale-text-editing__7EMtZzM', 'large-scale-text-editing__otLHNLP', 'large-scale-text-editing__HM4YxLF']",2,"[1245.536666, 1242.73648, 414.049017, 238.957385, 426.761913]","[12.259454, 231.035237, 43.101307, 94.978174, 321.288271]",0.4,False,"['11934b09-7fb4-4fb4-97d9-ded874403ba5', 'a2443d3a-6a5f-47ab-bfd9-871ed26d94f5']" +gemini-2.5-pro,largest-eigenval,5,"['35692ba5-269b-42ed-9476-e649ecdaa753', '3b63fa9d-4a69-4516-b287-e02da3b7abbf', '13cc6e17-e2a7-40b2-83bd-08d1bef6960c', 'e6babc3c-9239-4b02-adde-6958d6581dea', '58b0f697-532c-4f2f-9210-02e3f189022b']","['largest-eigenval__Uez65MF', 'largest-eigenval__NA2Q6YU', 'largest-eigenval__AUQx5tK', 'largest-eigenval__wwV9FFA', 'largest-eigenval__e6oACgS']",0,"[913.605252, 900.000734, 904.484564, 919.057432, 901.384442]","[44.094531, 38.984451, 245.909832, 141.557337, 34.090777]",0.0,False,[] +gemini-2.5-pro,log-summary-date-ranges,5,"['dd6e062f-d678-4c50-8914-f8593e4bd2ad', 'd28f6ef7-a454-41a2-9937-a1473052751d', 'fd1d2ad9-8e48-482a-bbf8-13e6ea132bb5', 'a01331e5-dea6-4f81-8569-4a7e82ea9aff', '95d942a2-62c2-44d1-b4da-0453f0154f5d']","['log-summary-date-ranges__pmuSKo4', 'log-summary-date-ranges__mtCFJaE', 'log-summary-date-ranges__UZvYQcH', 'log-summary-date-ranges__3hCwUz3', 'log-summary-date-ranges__KqGnxGi']",0,"[293.474978, 210.256406, 114.233689, 368.290727, 392.271661]","[158.202639, 60.957608, 28.640931, 79.122958, 90.969136]",0.0,False,[] +gemini-2.5-pro,make-doom-for-mips,5,"['5251c4dd-3473-4146-896d-aa917a4ae002', '217a383a-2133-4d4f-af8e-dedcb8ee110c', '29e23bc8-878b-463b-8c3b-27f1dfd4ee7a', '1f283767-4817-4621-b07d-44965a467ca5', 
'f7e478f3-c500-4543-b744-ac00c383c202']","['make-doom-for-mips__Jyiug8B', 'make-doom-for-mips__4M6pvoL', 'make-doom-for-mips__GtmrY2Y', 'make-doom-for-mips__CyGXan5', 'make-doom-for-mips__LYyv5pr']",0,"[901.588419, 1140.0117, 903.060768, 905.351779, 908.601223]","[230.944509, 37.75476, 117.941466, 68.267172, 37.127551]",0.0,False,[] +gemini-2.5-pro,make-mips-interpreter,5,"['cb0a7daf-a664-4f7d-868b-8a93287a02fa', '634f39b8-512a-4f46-8b0d-dbbed57ffd01', 'a0124f49-0031-49e3-8ba6-19596f24831c', 'cb7b9966-b944-41ca-8e17-b32721917949', '33e41779-9e60-4507-9a03-e1c45697ede4']","['make-mips-interpreter__bf6GoMx', 'make-mips-interpreter__AVsAQiv', 'make-mips-interpreter__uzeoByV', 'make-mips-interpreter__6gEoRTk', 'make-mips-interpreter__2oEgWWk']",0,"[1804.875428, 1802.37413, 1813.991046, 1084.159161, 1059.092077]","[36.92682, 19.345546, 99.819684, 241.434246, 84.035332]",0.0,False,[] +gemini-2.5-pro,merge-diff-arc-agi-task,5,"['78902d80-ee98-4957-be60-3963d6b9553a', '20f53b78-d932-4bdf-bd4d-ca39e6128522', '875fe2f9-879b-49d3-aea9-9a875ea7c4d5', '5fc11512-4b0e-4eb5-8313-398638a6adac', '517c2497-6f85-4980-a42e-8c6f39328a4f']","['merge-diff-arc-agi-task__WEbM9QN', 'merge-diff-arc-agi-task__FeCd6Ay', 'merge-diff-arc-agi-task__6eqXUwR', 'merge-diff-arc-agi-task__Ep6RNVJ', 'merge-diff-arc-agi-task__6Vmb48L']",3,"[870.074649, 791.547286, 301.771479, 255.241637, 919.659348]","[159.950216, 150.99585, 12.671516, 21.013093, 83.542439]",0.6,True,"['875fe2f9-879b-49d3-aea9-9a875ea7c4d5', '5fc11512-4b0e-4eb5-8313-398638a6adac', '517c2497-6f85-4980-a42e-8c6f39328a4f']" +gemini-2.5-pro,model-extraction-relu-logits,5,"['ba1d22d4-6360-4662-afb7-21f3ebc062d8', 'ec4ddbaa-eafa-4e8a-bd90-de2255a52fa7', '1c2a993b-c6b6-4ea1-bbd8-166d05ac01c3', '949cd74a-c571-4201-a276-5a1accf20e0e', 'bf25fe96-a679-445e-b299-25ffc963e6a0']","['model-extraction-relu-logits__FDiaUHH', 'model-extraction-relu-logits__PFJmfHC', 'model-extraction-relu-logits__5icCJCA', 'model-extraction-relu-logits__5FGnaAT', 
'model-extraction-relu-logits__PUS8Wru']",0,"[537.082613, 1419.73534, 229.467774, 379.072137, 556.541947]","[35.563919, 15.097375, 28.176295, 98.413292, 61.620568]",0.0,False,[] +gemini-2.5-pro,mteb-leaderboard,5,"['379e18f3-942a-4915-b113-42d444932bc7', 'beb317dd-8cc0-4cd5-8fe2-49dbe4bfcbb8', 'fa533879-633f-44e4-9beb-0367d85fb7a2', 'e5adf4b0-6cf2-4dde-ab9e-9b4f751a65be', 'afaac7c3-cb40-4ff3-a4bd-3ba920347e6c']","['mteb-leaderboard__APnmMB4', 'mteb-leaderboard__6M9kkDx', 'mteb-leaderboard__UhTMzVX', 'mteb-leaderboard__L42b2PF', 'mteb-leaderboard__69RYLiV']",0,"[3606.706124, 2762.811167, 3619.546331, 1546.836951, 400.520879]","[13.678436, 4.36488, 17.58106, 2.886937, 6.576036]",0.0,False,[] +gemini-2.5-pro,mteb-retrieve,5,"['a43c3cf3-e59e-47d7-96e8-63d7f7571cee', '00814575-1545-4f5c-b500-9745e3084412', '3be62b55-b5fc-4363-85db-44fb31833124', 'b9d3c095-47bb-4b34-9e26-057d532b1467', 'cb437aa1-6441-4e43-bc41-145d50d03f97']","['mteb-retrieve__mKgm2No', 'mteb-retrieve__Lh5A4iy', 'mteb-retrieve__6vS6qo5', 'mteb-retrieve__ajkmwbn', 'mteb-retrieve__FDPSiqT']",0,"[235.588292, 169.302086, 379.667864, 151.384585, 265.08156]","[154.727614, 35.238919, 76.005194, 5.610541, 30.07196]",0.0,False,[] +gemini-2.5-pro,nginx-request-logging,5,"['f0ef115c-7434-4c6e-b7e9-c636519f3e05', '4a558285-b12b-41a1-b4db-6b634aaabadf', '28813d60-6bf7-48c0-b48b-2ff82aebd76f', 'f5d30300-ef64-4314-a244-eca820e84e93', '9bd077b3-0c98-40ba-9db8-c3f042dca5ba']","['nginx-request-logging__tcYfrPj', 'nginx-request-logging__6MZxnJT', 'nginx-request-logging__EbuaEQi', 'nginx-request-logging__ZdWa9Bs', 'nginx-request-logging__qqCoowX']",3,"[255.212445, 396.030978, 105.732398, 177.69263, 290.799818]","[161.968574, 34.147199, 21.754099, 20.554447, 47.510522]",0.6,True,"['f0ef115c-7434-4c6e-b7e9-c636519f3e05', '28813d60-6bf7-48c0-b48b-2ff82aebd76f', 'f5d30300-ef64-4314-a244-eca820e84e93']" +gemini-2.5-pro,openssl-selfsigned-cert,5,"['c2f1bbe8-98b5-42ce-acdb-7eaec0fe27f3', 'a6afc17a-ec75-4d7d-a800-1ae095eeede6', 
'2cd7ee00-e4e0-4b9b-93fb-a0a0927d830e', '880f477a-f11e-4e47-abda-9aecf2538b26', 'db9f55e6-862e-4cfd-a4c7-7314322cba78']","['openssl-selfsigned-cert__FtvRmgs', 'openssl-selfsigned-cert__zVUKFMv', 'openssl-selfsigned-cert__uaeeDao', 'openssl-selfsigned-cert__QzdPNsN', 'openssl-selfsigned-cert__V3B44fC']",3,"[148.691059, 204.034046, 145.991291, 187.011159, 283.026972]","[47.298945, 38.884216, 43.979853, 70.018457, 45.239708]",0.6,True,"['2cd7ee00-e4e0-4b9b-93fb-a0a0927d830e', '880f477a-f11e-4e47-abda-9aecf2538b26', 'db9f55e6-862e-4cfd-a4c7-7314322cba78']" +gemini-2.5-pro,password-recovery,5,"['12363f43-2d10-4ca4-81d1-9f8d53753b93', '78cd3ea7-1c3d-4adf-ac00-290cbf33e7b6', '01e7ea3d-e15d-44fd-a84d-1d33afeef2f6', 'ac754c85-be90-49e7-8647-43da78db4479', '69c5fa14-dca0-43e6-9729-ccd3d9ac5a6f']","['password-recovery__namovxN', 'password-recovery__aPrfvhr', 'password-recovery__BGgfqN2', 'password-recovery__B43Zi6t', 'password-recovery__KsqT5Xw']",0,"[1590.976104, 933.364235, 901.07837, 906.229453, 917.999784]","[80.643292, 19.494982, 260.035781, 55.34067, 41.084176]",0.0,False,[] +gemini-2.5-pro,path-tracing,5,"['b2c4efb1-f942-4c47-92ab-c68ee78a2121', '3be5bc00-4b96-4d4b-a7c2-b35028544c7b', '007eb065-a6d2-4bf2-b86b-4a43b29a50dc', '715f036e-2117-4c6f-8027-ad342faf6622', 'b6771c15-4778-4be2-80c1-bf3d36e89dc1']","['path-tracing__3JSUipG', 'path-tracing__bXH8iBa', 'path-tracing__XoJf8Gx', 'path-tracing__idcMtMw', 'path-tracing__6yqEqZY']",0,"[347.161579, 286.591562, 235.540327, 345.822348, 406.604805]","[62.731371, 15.275236, 16.570468, 14.040424, 24.172591]",0.0,False,[] +gemini-2.5-pro,path-tracing-reverse,5,"['88b81eb6-e2b1-49e1-8042-7a15cd8b2d09', '5d04e8a7-b826-4e79-840a-af4302fc43e2', '51edb7ae-065b-4b87-8b97-ca0ab23d0e58', 'e6e4c2ca-a0b8-4091-9195-f9446a5be443', 'b1e73074-87af-467f-9cf2-d38237429456']","['path-tracing-reverse__JPsJZVR', 'path-tracing-reverse__bpGZGW9', 'path-tracing-reverse__RstxBAP', 'path-tracing-reverse__M6FBVRq', 
'path-tracing-reverse__fUdaQgz']",0,"[1835.024521, 1804.042435, 867.449715, 1844.497132, 575.791679]","[31.703453, 100.387613, 52.756021, 25.094139, 36.493489]",0.0,False,[] +gemini-2.5-pro,polyglot-c-py,5,"['734e3d25-3eb1-4c32-8619-dc372f72e124', '8f7b2626-e5bd-46e6-9a86-ac5425a89f9a', 'ca4278e7-3cea-411a-86cb-bac0d3ade1d9', '70a7a9c6-73bc-4892-abd9-7bd13f3dd568', '970c8cb4-52ad-428f-8bac-eea6bdf5c12a']","['polyglot-c-py__nshK6gT', 'polyglot-c-py__X5oaLHv', 'polyglot-c-py__7pKq225', 'polyglot-c-py__bbCZHoB', 'polyglot-c-py__92McudC']",1,"[90.301479, 151.89027, 346.035359, 188.919988, 214.833179]","[32.477083, 37.25521, 24.092183, 45.989481, 68.750446]",0.2,False,['70a7a9c6-73bc-4892-abd9-7bd13f3dd568'] +gemini-2.5-pro,polyglot-rust-c,5,"['07020d61-dab7-44d6-b40b-48781601f357', '0f06d7df-060d-40e6-89db-9a3eacf6194e', 'cf232c56-6d3c-4d64-bb1d-1c0d5617cabf', '8e6a5074-9071-4c97-aed6-4f2aeb388de6', '7fe3e457-630a-41b7-b9c7-d07b66991bf0']","['polyglot-rust-c__Rmxda8u', 'polyglot-rust-c__r84KatE', 'polyglot-rust-c__DDJd3rY', 'polyglot-rust-c__un4TzGn', 'polyglot-rust-c__ivWcBap']",0,"[959.010598, 424.089692, 297.3684, 909.72141, 544.45041]","[78.605298, 61.11081, 329.447323, 34.978883, 87.481235]",0.0,False,[] +gemini-2.5-pro,port-compressor,5,"['1186f2d0-79ef-4e0b-92a1-3f81921329d5', 'eca79742-1a0f-4013-bde1-c703fd850be0', '12cc21bc-0d8e-4675-964b-c67d323cf3e2', 'b379b986-867b-494f-a689-4593c27d383f', '2fe66311-4894-4249-96f9-916b8d440e1f']","['port-compressor__ucgDkF6', 'port-compressor__q2DKGjB', 'port-compressor__XH6ieDk', 'port-compressor__TiwbNgB', 'port-compressor__FGPYPv5']",0,"[3611.956151, 3600.001709, 3618.339634, 3564.083488, 3600.001435]","[75.287605, 96.838105, 50.274441, 97.41832, 39.056583]",0.0,False,[] +gemini-2.5-pro,prove-plus-comm,5,"['8e9968cb-4a93-4f72-9e8c-a205db4744f0', 'f23fff11-6f50-47e9-86f1-041580c2d253', 'e32be8d8-fd6b-4a05-b1ae-b3a3e7bdd55f', 'f8d7a257-9adb-4d09-93de-55cf1a6233ee', 
'd8f40f19-62e5-495d-ba44-df6c68c1e940']","['prove-plus-comm__qKRo7Hb', 'prove-plus-comm__FaL2RCy', 'prove-plus-comm__f4tR8n7', 'prove-plus-comm__Lxfa3Y3', 'prove-plus-comm__TGABi8h']",4,"[330.444313, 240.055873, 227.05448, 383.148952, 900.049729]","[27.855685, 54.690602, 87.726794, 22.232052, 23.022602]",0.8,True,"['8e9968cb-4a93-4f72-9e8c-a205db4744f0', 'f23fff11-6f50-47e9-86f1-041580c2d253', 'e32be8d8-fd6b-4a05-b1ae-b3a3e7bdd55f', 'f8d7a257-9adb-4d09-93de-55cf1a6233ee']" +gemini-2.5-pro,pypi-server,5,"['a1563cd0-f27b-4475-acd3-bf58905e134c', '0a61f64c-9b82-48ab-b4c9-17faab102bca', '01d0bbdd-6daa-4b1d-9b79-544240346808', '1565a4e7-7ff6-4d47-abe5-8e095aef4f2a', '4cd4fa16-cdc0-4013-ab0e-e535fec3386f']","['pypi-server__zHAQ9X2', 'pypi-server__EWz9ueJ', 'pypi-server__vX9BUps', 'pypi-server__cSZHHL8', 'pypi-server__ZHGqDXT']",4,"[514.246346, 382.741979, 630.920116, 825.17696, 511.302286]","[18.396158, 101.141604, 77.049858, 72.546302, 36.423998]",0.8,True,"['a1563cd0-f27b-4475-acd3-bf58905e134c', '01d0bbdd-6daa-4b1d-9b79-544240346808', '1565a4e7-7ff6-4d47-abe5-8e095aef4f2a', '4cd4fa16-cdc0-4013-ab0e-e535fec3386f']" +gemini-2.5-pro,pytorch-model-cli,5,"['305db620-a680-43c3-a20f-77999cd2a3fc', '77ddeb19-484d-4669-a7f3-fc61f0353db2', '9a199c5d-afac-411f-a125-81d884303cc8', '220c858b-cb47-45b1-82b2-8ce0ea90e450', '8b4b606c-bceb-41b8-a19f-8a7c2281a790']","['pytorch-model-cli__LQzemK3', 'pytorch-model-cli__BsDD8NX', 'pytorch-model-cli__2rBNKTa', 'pytorch-model-cli__TjZjfUY', 'pytorch-model-cli__8myvDEG']",2,"[768.194992, 97.803647, 359.02534, 900.00787, 346.949304]","[63.632137, 96.464658, 131.060889, 63.945133, 45.122495]",0.4,False,"['305db620-a680-43c3-a20f-77999cd2a3fc', '220c858b-cb47-45b1-82b2-8ce0ea90e450']" +gemini-2.5-pro,pytorch-model-recovery,5,"['92ad4c47-85fb-4799-9501-d9a758ee09d9', '7f803f68-3bc2-4887-8159-f1d65b547847', '758dff0f-500d-43a1-863a-744a5ac2b0f1', '5ba4a7ec-fb21-42bb-8ad6-ab6fc457ad14', 
'bbf9e4c6-c784-487b-b036-dbb5f4b80399']","['pytorch-model-recovery__tXE2Aco', 'pytorch-model-recovery__DuVTMzW', 'pytorch-model-recovery__iHLm36B', 'pytorch-model-recovery__ZDftNwr', 'pytorch-model-recovery__xCFC5wL']",5,"[447.808289, 874.427811, 275.47569, 303.492384, 910.228245]","[58.414777, 44.522361, 106.302854, 13.736145, 47.395366]",1.0,True,"['92ad4c47-85fb-4799-9501-d9a758ee09d9', '7f803f68-3bc2-4887-8159-f1d65b547847', '758dff0f-500d-43a1-863a-744a5ac2b0f1', '5ba4a7ec-fb21-42bb-8ad6-ab6fc457ad14', 'bbf9e4c6-c784-487b-b036-dbb5f4b80399']" +gemini-2.5-pro,qemu-alpine-ssh,5,"['ac7e5321-4a79-4c78-9fd4-fff9eaba21ba', '524f0260-b55b-4443-ab46-42601de929cc', 'bce7f833-aae9-449f-b3dd-e7f4973f4ebb', 'f7e2dd74-15c0-40fb-9086-cb62e62c85e8', '06e755b3-0d5a-4057-988e-3546ad18a8cb']","['qemu-alpine-ssh__PpWKWRx', 'qemu-alpine-ssh__Db2z4m3', 'qemu-alpine-ssh__TiG8D6z', 'qemu-alpine-ssh__4oLTn7A', 'qemu-alpine-ssh__h4AAc3y']",1,"[227.564224, 252.888384, 842.572021, 337.163325, 439.323477]","[10.624895, 9.746019, 9.135836, 50.563123, 8.877993]",0.2,False,['bce7f833-aae9-449f-b3dd-e7f4973f4ebb'] +gemini-2.5-pro,qemu-startup,5,"['3ee0e99c-ff76-460f-a80a-c7bc476c66cc', '9ff8ef43-236f-4611-9c9d-28df1836433b', '5538baed-4a30-4d58-912c-42fdf6c3cd1d', '8619524a-a35f-4bd3-81a0-71b169e5f072', '35e11fab-812d-4161-83f1-ab8c80a0f4e3']","['qemu-startup__pAS6sEP', 'qemu-startup__UH56rqp', 'qemu-startup__najeb3s', 'qemu-startup__nANVPef', 'qemu-startup__tpAXk8z']",1,"[456.28347, 106.833497, 198.950849, 89.109801, 214.303761]","[20.330798, 7.352791, 36.440284, 4.981015, 3.064059]",0.2,False,['3ee0e99c-ff76-460f-a80a-c7bc476c66cc'] +gemini-2.5-pro,regex-log,5,"['1c80a047-a419-419c-91be-b157b0827062', '4196183f-9885-4780-91c0-5569a87cd7b3', '05a8f0e7-3275-4e52-b132-059c3051163e', '47598924-df71-44ac-b3ba-74a78d0feef9', '0e50d050-c6a4-4b9d-b09c-c69a3dc137b1']","['regex-log__sk9d8Kn', 'regex-log__joZ8KXH', 'regex-log__JZVCrKL', 'regex-log__px8KgCM', 'regex-log__mLkq5PL']",4,"[141.182113, 
109.631906, 219.624419, 201.023431, 107.855917]","[42.516863, 151.496137, 53.341727, 131.258738, 241.355087]",0.8,True,"['1c80a047-a419-419c-91be-b157b0827062', '4196183f-9885-4780-91c0-5569a87cd7b3', '05a8f0e7-3275-4e52-b132-059c3051163e', '47598924-df71-44ac-b3ba-74a78d0feef9']" +gemini-2.5-pro,reshard-c4-data,5,"['eb211567-6114-451a-a756-de4601439e6e', '05199fa2-cc1e-4201-bae0-6bf937da1b3c', '4c2f3126-31c8-4171-93c4-9751e7c410a8', 'b7ceec9f-a5d7-4d8a-8e72-389a7b6f57d5', 'feaebab0-3b67-47b9-93e9-28033d7cec5f']","['reshard-c4-data__ExxbGZo', 'reshard-c4-data__wkrnVXS', 'reshard-c4-data__yQu6aGz', 'reshard-c4-data__JwyWQUZ', 'reshard-c4-data__gkcDt7v']",0,"[280.366479, 514.007344, 554.952568, 274.800057, 242.309009]","[102.625757, 60.584029, 189.138681, 44.453644, 63.636199]",0.0,False,[] +gemini-2.5-pro,reverse-engineering,5,"['817d7850-7fe1-4421-ab53-57b16da14659', '71da4ddc-57ee-44be-9ec5-905d3db1cd68', '6448dab5-d962-4835-9f21-2ebf832e1c68', '2b29ddb6-ccea-4ba3-bd42-0108506e496f', '2a511ec9-bd36-4719-83f6-424e27fcff43']","['reverse-engineering__A5uuHPh', 'reverse-engineering__zRJb8MH', 'reverse-engineering__FwedYLq', 'reverse-engineering__aKBZdgx', 'reverse-engineering__jGPM4pA']",0,"[898.736955, 1828.588204, 1806.484505, 1803.890926, 1502.86234]","[11.100258, 22.098956, 48.589721, 52.444769, 46.151991]",0.0,False,[] +gemini-2.5-pro,run-pdp11-code,5,"['ae0878f6-36f5-4c1a-8f5d-6a9c723bee52', '0e35e7b5-4078-4351-aeb8-7b7fa71165a3', '4de074b7-1534-4b27-b38f-53ca493e3634', '1a57f12e-dacc-4078-ab30-3eb016ba3cec', 'e352fcac-0c21-40bc-a7ce-04c68b369378']","['run-pdp11-code__x9LvoTj', 'run-pdp11-code__LtWwQUy', 'run-pdp11-code__3eGKPaJ', 'run-pdp11-code__gSBdkQM', 'run-pdp11-code__vYVrpvu']",0,"[1123.358238, 1021.943654, 1000.576743, 399.718383, 1016.359131]","[86.46307, 62.354411, 19.182443, 24.961416, 38.960422]",0.0,False,[] +gemini-2.5-pro,sanitize-git-repo,5,"['e3234ee1-58a6-4294-a6a0-f096ac936ab3', '268318a5-a2ca-4f64-b5e3-33554cbd0807', 
'210af782-0274-40f2-8fd3-7c6e777b437e', '0f3f110a-3987-43ef-9774-6a0428e6a22e', '69454a0b-f518-4501-b003-ba26d9981629']","['sanitize-git-repo__HLsGH8z', 'sanitize-git-repo__KLJAYjH', 'sanitize-git-repo__UVd5MeV', 'sanitize-git-repo__GRMtm7e', 'sanitize-git-repo__6PHdX2k']",0,"[142.291642, 264.145468, 948.924235, 1176.674548, 268.295875]","[23.181219, 33.557054, 122.255618, 148.892877, 46.206828]",0.0,False,[] +gemini-2.5-pro,schemelike-metacircular-eval,4,"['208e5257-6ee2-4a92-8f8e-f68712fe9794', '69b2f840-f461-4cc1-94e7-276ef22ba627', 'c85b9d3f-fb1a-48a0-8406-da6aa1b5060d', 'ef888d92-2b9a-4917-baae-981f37e6f903']","['schemelike-metacircular-eval__9N9SESA', 'schemelike-metacircular-eval__Jvdtyap', 'schemelike-metacircular-eval__trRGDr3', 'schemelike-metacircular-eval__SxjBPzE']",0,"[1456.767477, 1263.391927, 2405.495779, 947.104285]","[96.617765, 92.156337, 96.54361, 43.909361]",0.0,False,[] +gemini-2.5-pro,sparql-university,5,"['08a2960c-f3db-4aca-a129-0affc8c1a792', '017ee42e-11a5-49c8-8e23-e9abfd41e5a1', 'ec0abb8c-d882-4b9a-8944-8bdfe6f664ec', '5efce481-8c38-4bb4-be18-543903df2a89', 'a17c6f0d-3aea-441b-918c-e1cf26e4bc26']","['sparql-university__EnpYPHX', 'sparql-university__kYEbZqJ', 'sparql-university__FRhDRHK', 'sparql-university__s8T7Vd8', 'sparql-university__h5dJ48B']",3,"[1011.935806, 197.260861, 127.174053, 113.766223, 271.966533]","[198.606059, 35.784065, 27.936427, 53.505058, 53.943713]",0.6,True,"['08a2960c-f3db-4aca-a129-0affc8c1a792', 'ec0abb8c-d882-4b9a-8944-8bdfe6f664ec', 'a17c6f0d-3aea-441b-918c-e1cf26e4bc26']" +gemini-2.5-pro,sqlite-db-truncate,5,"['fd2746ac-ebda-4090-b6f8-158ff3e5712a', '0946432d-d373-486b-816e-770ebdb4998b', 'd77ba50c-fa36-4768-b4f0-1c5e4ac1460b', '0ed143cf-2262-4005-91b6-c1d20a078995', '348f4ebb-349f-40f9-8910-7d2a667b86ec']","['sqlite-db-truncate__SwoS3Dy', 'sqlite-db-truncate__Kh8n87b', 'sqlite-db-truncate__V3NoU9k', 'sqlite-db-truncate__JdjjMss', 'sqlite-db-truncate__xR9FFZB']",0,"[498.972732, 742.907514, 203.311204, 
357.585043, 228.332542]","[25.55365, 13.865175, 62.959615, 34.474499, 58.065581]",0.0,False,[] +gemini-2.5-pro,sqlite-with-gcov,5,"['5f99ceed-1b2d-4d59-95b1-1a6f66db194a', 'da21f184-3c41-4be5-ae08-b586a61cf701', 'b8b258dd-b1e0-459d-af32-020af83bf977', 'b32d0c50-0bbf-4c4c-8fe3-cf7ae0abf9b2', 'd2d868ce-b51e-465d-baca-98bfe4a941af']","['sqlite-with-gcov__eUcsz5s', 'sqlite-with-gcov__GULwHud', 'sqlite-with-gcov__zWEmMNY', 'sqlite-with-gcov__jVCWL8u', 'sqlite-with-gcov__uCnjuTJ']",4,"[431.608876, 263.09336, 319.10009, 432.938835, 329.945283]","[27.935673, 35.999735, 68.493124, 140.635966, 60.736468]",0.8,True,"['5f99ceed-1b2d-4d59-95b1-1a6f66db194a', 'da21f184-3c41-4be5-ae08-b586a61cf701', 'b32d0c50-0bbf-4c4c-8fe3-cf7ae0abf9b2', 'd2d868ce-b51e-465d-baca-98bfe4a941af']" +gemini-2.5-pro,torch-tensor-parallelism,5,"['25d527b3-f5fa-42b7-bb01-73df19023097', 'b37c917b-c336-4b4c-89b8-2c46c5227376', '0a58d159-718f-4974-abec-71ffa805d259', 'd270af73-c466-4b4f-987e-3f2fb5c5086a', '7dd0188d-e6b7-47ac-9e2f-9d2724e89ec7']","['torch-tensor-parallelism__w73tXav', 'torch-tensor-parallelism__PCzHL32', 'torch-tensor-parallelism__Qv6xxVr', 'torch-tensor-parallelism__xtqW3tn', 'torch-tensor-parallelism__VyaZjyv']",0,"[91.635433, 71.931027, 131.577036, 91.335838, 154.811466]","[21.248811, 33.117527, 37.647097, 19.854807, 41.496734]",0.0,False,[] +gemini-2.5-pro,train-fasttext,5,"['44584cfe-51c7-4710-a675-0f444937a90e', '020b5cc6-97bc-4df0-8135-4074a49e12e2', 'd8b301eb-5d59-425d-a649-589ae869175b', 'cd448acc-9fd1-456c-9528-3869a2eeb6e0', '8d442bcd-04d8-42aa-ad4e-834f00602a26']","['train-fasttext__Aj4FZ82', 'train-fasttext__Bnst4Qq', 'train-fasttext__7MWa89G', 'train-fasttext__Ty4aVZC', 'train-fasttext__ZD4JHFs']",0,"[3607.245154, 3609.482687, 3601.985707, 3601.220383, 1510.976587]","[70.141896, 19.271385, 84.642846, 154.234468, 20.771586]",0.0,False,[] +gemini-2.5-pro,tune-mjcf,5,"['25ecb3c8-99b2-4212-a3cc-4e8e3de85bce', 'd4a79710-cd0f-48dd-8310-b669e97563dc', 
'f9e68490-a9b1-4bb1-bee3-e03564d23215', 'e85a7a39-5de6-4f26-9fc7-418f7cfcda46', '9c9fe6b9-b32d-42be-a9e6-971e95689235']","['tune-mjcf__M7jaL8f', 'tune-mjcf__zbG6QVx', 'tune-mjcf__4FpgiXG', 'tune-mjcf__7qo28Fy', 'tune-mjcf__C8bsxdW']",1,"[902.748268, 670.397557, 929.426821, 900.002714, 912.093685]","[15.10843, 9.984595, 18.476519, 23.170003, 18.833303]",0.2,False,['d4a79710-cd0f-48dd-8310-b669e97563dc'] +gemini-2.5-pro,video-processing,5,"['9678e0fd-cdbd-4070-b1e4-caf6ea18e362', 'f4e9d225-b058-4d23-8ade-0e0807db12b8', '8629563b-b5c9-4598-8c11-351a55eea5e5', '8b0afaf3-c1cb-47f7-978d-73841854dd25', '2de09c9a-22a0-49ff-9db9-61d2add03b76']","['video-processing__MGyj3vv', 'video-processing__5HHGqJh', 'video-processing__A9Umwce', 'video-processing__ZF5hURx', 'video-processing__Yga8K6k']",0,"[498.938253, 1271.858999, 168.156932, 621.493911, 301.453438]","[105.259283, 55.135159, 160.082356, 30.608606, 73.18509]",0.0,False,[] +gemini-2.5-pro,vulnerable-secret,5,"['7862f772-f0c0-4cd6-bc2a-8c572d18a41a', '11e3074d-709e-4241-923b-9d55a3e7789a', '710d6e3d-908f-4740-b092-fab2159d60fc', '5beba5f6-6e0e-4f19-b0d3-990df690dd62', 'b044de13-2f01-48b2-9006-4e2ed9783d5d']","['vulnerable-secret__u8aoRfu', 'vulnerable-secret__aPd6WTa', 'vulnerable-secret__evY7mHJ', 'vulnerable-secret__fPGQpHJ', 'vulnerable-secret__U7EjFvt']",4,"[649.110238, 254.776907, 840.93766, 236.203981, 901.357734]","[27.750839, 9.293861, 51.133779, 23.268562, 69.452779]",0.8,True,"['7862f772-f0c0-4cd6-bc2a-8c572d18a41a', '11e3074d-709e-4241-923b-9d55a3e7789a', '710d6e3d-908f-4740-b092-fab2159d60fc', '5beba5f6-6e0e-4f19-b0d3-990df690dd62']" +gemini-2.5-pro,wasm-pipeline,5,"['675fa499-2e18-4af8-85dd-0ce2f4a0ad59', '51221b1b-da66-43fe-972f-c28097569394', 'f787959a-c1fd-4758-80d5-67259eb0c4ec', '59e8ab15-2727-47bc-b462-17d43641a1a8', '2d534205-5b7c-49a3-82c4-4d22f8373a39']","['wasm-pipeline__cJ2fw7r', 'wasm-pipeline__WQP93zU', 'wasm-pipeline__treR92X', 'wasm-pipeline__5Nejmby', 'wasm-pipeline__TjSxj2s']",0,"[921.189737, 
404.091312, 529.520143, 293.04408, 415.427435]","[8.110561, 20.538533, 5.518482, 6.302975, 8.262362]",0.0,False,[] +gemini-2.5-pro,winning-avg-corewars,5,"['7def81f5-d4e3-43d4-9ca2-d5e1f33541a8', '242f6209-f7ec-4701-b499-f2de0cea1931', 'd0dae0b3-3724-4764-a61c-8c7dbf72d512', 'b208c1fc-7482-4ea2-a46d-a94992e639fc', 'cc11a0a4-f69c-457e-b375-be95a3f2cda9']","['winning-avg-corewars__XYxKFHn', 'winning-avg-corewars__qEzzVtQ', 'winning-avg-corewars__bgHziZR', 'winning-avg-corewars__xnxRLkJ', 'winning-avg-corewars__CCZgFuc']",0,"[1339.260448, 3602.992949, 3606.094026, 3617.822027, 3601.276672]","[14.037068, 10.776633, 38.13438, 80.275281, 92.850937]",0.0,False,[] +gemini-2.5-pro,write-compressor,5,"['89d95090-6d65-43aa-bc9f-9d6c29cbdb51', '26388b9d-64e7-42c8-989d-79d21c95e205', 'ce28af1d-f127-4f80-81ee-c5d53ff81b0a', '5edce7e8-72f1-4666-838d-e83094cf8e6a', 'a8031f57-d582-45fb-8d75-88d73aeddbd8']","['write-compressor__sz9je8T', 'write-compressor__ZfzjKUz', 'write-compressor__rmBaYLp', 'write-compressor__hua2J2n', 'write-compressor__iLjzfsJ']",0,"[946.373119, 1454.964977, 930.475917, 920.16247, 904.423041]","[27.138827, 180.046302, 35.615782, 77.407149, 37.486424]",0.0,False,[] +gpt-5,adaptive-rejection-sampler,5,"['687c7370-6aef-4fef-90f1-94d1dda3e35e', '7d2b6597-4f90-48f0-873d-d9d842cdfb62', 'fdfc18b9-f834-45b2-b62f-56efca017ca7', 'ab27df81-2b05-45f4-ae2a-7ce61f570c33', 'adbc4e26-5096-4592-a5f7-7773a9a553a5']","['adaptive-rejection-sampler__Rj2XFYK', 'adaptive-rejection-sampler__QDUEBhe', 'adaptive-rejection-sampler__XibcUyp', 'adaptive-rejection-sampler__uRmUk36', 'adaptive-rejection-sampler__qxob8DT']",2,"[947.259483, 900.063841, 902.826155, 901.473466, 900.075567]","[65.090096, 59.375827, 105.093549, 121.767155, 96.403748]",0.4,False,"['7d2b6597-4f90-48f0-873d-d9d842cdfb62', 'adbc4e26-5096-4592-a5f7-7773a9a553a5']" +gpt-5,bn-fit-modify,6,"['dc0a9892-35d4-48b7-b7dc-d6839b616d36', 'f2602f60-a204-4ac5-8318-6a3af767cc98', '79c5d0ad-8a4e-4474-aee7-00feca5cf772', 
'b75991f1-a1a4-49b8-a79d-fda46a16dd79', '422e1882-413a-4e65-b8e1-81fd9ac2859c', 'eb815c04-79f6-4e3c-97fd-73f163437195']","['bn-fit-modify__pKGvqpK', 'bn-fit-modify__Cgmijq6', 'bn-fit-modify__sL5YhyA', 'bn-fit-modify__xNKuKWd', 'bn-fit-modify__xY3ocPL', 'bn-fit-modify__RNk6sNE']",3,"[782.229744, 318.920008, 369.170403, 893.268747, 1151.545079, 663.819466]","[12.146497, 189.436042, 26.456918, 322.283488, 67.000069, 28.262767]",0.5,False,"['dc0a9892-35d4-48b7-b7dc-d6839b616d36', '79c5d0ad-8a4e-4474-aee7-00feca5cf772', 'b75991f1-a1a4-49b8-a79d-fda46a16dd79']" +gpt-5,break-filter-js-from-html,7,"['d5200423-de2e-409f-b3ad-204bc2d297fd', 'd439f183-792a-47ed-8907-72fd2367095f', '471a897c-ef65-47bc-a26d-f60139da84b6', '2c31ca6e-d20f-47f7-bb24-b24ba694b441', 'fee3a8fd-bfb6-4f94-bf0a-22c7d4f76eb6', 'c7c1f375-a11a-44fd-bb85-1ff5485c4f5b', 'f9fad111-60cc-45e5-97f4-d66e22b3f12a']","['break-filter-js-from-html__npeXtM9', 'break-filter-js-from-html__hHhd7Gj', 'break-filter-js-from-html__2zq5oCx', 'break-filter-js-from-html__AdsTxDX', 'break-filter-js-from-html__XoJAiJk', 'break-filter-js-from-html__TQ2cmbN', 'break-filter-js-from-html__Eu9efzH']",3,"[161.146064, 421.532825, 437.814998, 221.7925, 563.454374, 615.119177, 599.685202]","[15.133638, 97.328659, 12.966525, 6.361004, 7.165901, 39.944847, 79.651925]",0.42857142857142855,False,"['d439f183-792a-47ed-8907-72fd2367095f', 'c7c1f375-a11a-44fd-bb85-1ff5485c4f5b', 'f9fad111-60cc-45e5-97f4-d66e22b3f12a']" +gpt-5,build-cython-ext,6,"['7a2bf2b9-3b4c-43ca-86df-76c3df820431', 'f465839f-9d5d-493f-86ab-68a7290a1086', 'c3e27173-fb80-472d-8eb0-36b0f157a96e', '1d609737-7f44-4c78-8e59-e10c2ddde87f', '3eff1b3a-3c93-4a74-b83e-1818ba20c3c1', '7923a23e-9a79-453c-9a53-13bf733b0482']","['build-cython-ext__S89rYkx', 'build-cython-ext__AeJcYuJ', 'build-cython-ext__sfC2csb', 'build-cython-ext__m5qNqTS', 'build-cython-ext__5bUWphi', 'build-cython-ext__oo7SJqp']",0,"[923.773514, 900.004222, 900.031282, 911.364356, 953.928777, 900.471463]","[176.372658, 
13.160192, 49.164417, 28.202652, 99.972918, 9.155067]",0.0,False,[] +gpt-5,build-initramfs-qemu,1,['21fb9e43-1658-4e4c-a923-d7735aabc3c2'],['build-initramfs-qemu__RDRopzT'],0,[929.613089],[39.362912],0.0,False,[] +gpt-5,build-pmars,5,"['2bde6e26-cef3-4c39-beec-af16e99dcea2', '478f169d-bf19-454b-9ef1-92823cfc118e', 'aaf2e8ee-6a7a-4aca-966d-71d622dba3de', '1aa25fb9-a79a-477b-b626-47ffc541a59f', '36b1a6c3-b6ec-4584-8b61-56df6d401b2a']","['build-pmars__ok8cfXs', 'build-pmars__bpRRSDh', 'build-pmars__PySxv5Y', 'build-pmars__by93HKK', 'build-pmars__H2qC2zz']",4,"[618.237492, 420.529629, 941.314624, 670.429353, 569.860484]","[5.174896, 5.036894, 15.337593, 4.794892, 41.452192]",0.8,True,"['2bde6e26-cef3-4c39-beec-af16e99dcea2', '478f169d-bf19-454b-9ef1-92823cfc118e', '1aa25fb9-a79a-477b-b626-47ffc541a59f', '36b1a6c3-b6ec-4584-8b61-56df6d401b2a']" +gpt-5,build-pov-ray,5,"['77741cd1-a259-4917-b33c-4dd85aae21cf', 'c6f2ae87-ba96-4961-b7f1-b79b1f0cde6b', '502f9f71-6539-468d-9d85-4d8825075884', 'caa748fc-ef61-44e1-8c2e-72f685681bd9', '3974277b-9ee3-49ba-95a3-e6ce60994f5b']","['build-pov-ray__BB9vxJ5', 'build-pov-ray__jDPtmKA', 'build-pov-ray__jtm5N4v', 'build-pov-ray__jfeBeio', 'build-pov-ray__zVETpsE']",0,"[4502.348002, 6000.096154, 693.824771, 1508.40576, 6000.001667]","[79.732767, 47.299542, 92.864631, 157.67983, 32.148175]",0.0,False,[] +gpt-5,cancel-async-tasks,5,"['e6454828-7cc7-476b-927e-e01c78d831c4', 'd7698122-e62a-4fe9-b957-7f78bc30e1d3', '583c8ec8-67df-453b-906f-ce43f79d7799', '15aead98-2744-4c83-ba52-3e1ff732c594', 'd879309a-4d8f-4aee-a7ae-f05d0f15b2c3']","['cancel-async-tasks__dzux7zG', 'cancel-async-tasks__VgoiuT5', 'cancel-async-tasks__ecSoUoG', 'cancel-async-tasks__GvfNBZW', 'cancel-async-tasks__fWDjdcL']",3,"[140.779789, 180.043629, 129.744433, 441.621822, 109.211802]","[49.460765, 76.660152, 51.867534, 336.546133, 105.372618]",0.6,True,"['e6454828-7cc7-476b-927e-e01c78d831c4', '583c8ec8-67df-453b-906f-ce43f79d7799', '15aead98-2744-4c83-ba52-3e1ff732c594']" 
+gpt-5,chess-best-move,7,"['c60cad39-d472-4511-bf76-1191ff3c6d33', '445d761f-0bf4-4e5d-ab0b-37c4a733164c', '51f85e02-5b15-4f3d-9f3d-0ebd155c377a', 'c052e71f-e15e-4d9c-bb70-4ff3600eca4e', '9bdf3eb5-4198-44d1-85f8-109fd136eedb', 'f6a6cef1-d9d8-4245-8f87-fb3f3f47e48e', '8bfbe760-e999-4237-b08f-db20f82a984d']","['chess-best-move__Ne3gRtV', 'chess-best-move__37AEcZv', 'chess-best-move__WrnnZ8R', 'chess-best-move__m5v5R3m', 'chess-best-move__GAWT8VP', 'chess-best-move__iQpT8kx', 'chess-best-move__S2ETy27']",0,"[900.114747, 901.844325, 924.433937, 900.000906, 900.001182, 902.477519, 794.407654]","[9.07527, 265.981811, 56.081178, 11.191537, 22.981045, 15.05337, 14.862108]",0.0,False,[] +gpt-5,circuit-fibsqrt,6,"['57b5a96c-276a-4199-ad96-d7759d0a4e32', 'c833fd31-f4be-4e47-9252-d13aa3acca2b', '6c00e278-fa95-4adc-ace8-273951085a72', '51ae7bb7-3812-4e30-927e-28bf4ff4cf62', 'e315bb79-60bf-451f-a47d-0622529a8ac6', '25824a37-eb61-493c-b671-4bb34c65278f']","['circuit-fibsqrt__HuLdVHU', 'circuit-fibsqrt__N7t8zRq', 'circuit-fibsqrt__MHj5S3g', 'circuit-fibsqrt__vGPGU3H', 'circuit-fibsqrt__xrDQpb9', 'circuit-fibsqrt__mmpTAf5']",4,"[3606.389434, 2806.007752, 1002.388623, 1431.365257, 2780.124129, 3631.903935]","[77.750532, 8.703196, 18.557783, 50.41308, 42.542621, 20.016183]",0.6666666666666666,True,"['c833fd31-f4be-4e47-9252-d13aa3acca2b', '6c00e278-fa95-4adc-ace8-273951085a72', '51ae7bb7-3812-4e30-927e-28bf4ff4cf62', 'e315bb79-60bf-451f-a47d-0622529a8ac6']" +gpt-5,cobol-modernization,6,"['a5ee2eba-2af4-44fe-9b12-69b3bce53268', '0515143d-404b-466a-a207-0a670edd5207', '98a1727a-fad1-4d7e-8d7f-ed570888d97a', 'b04e852e-417c-454f-a9f3-d281597c5bb9', '3069d20c-bed1-4b7b-8b71-385297a6c1ae', '10e26a28-f40f-49f6-8451-d10717827599']","['cobol-modernization__MVVn6L5', 'cobol-modernization__AAMYhBJ', 'cobol-modernization__8LKWdF9', 'cobol-modernization__Egcuc5C', 'cobol-modernization__G8bAYoy', 'cobol-modernization__xdNpJTV']",6,"[426.111141, 320.6472, 904.580499, 217.411476, 225.235422, 
434.831796]","[19.63973, 10.631514, 106.187243, 12.104298, 50.184762, 54.115191]",1.0,True,"['a5ee2eba-2af4-44fe-9b12-69b3bce53268', '0515143d-404b-466a-a207-0a670edd5207', '98a1727a-fad1-4d7e-8d7f-ed570888d97a', 'b04e852e-417c-454f-a9f3-d281597c5bb9', '3069d20c-bed1-4b7b-8b71-385297a6c1ae', '10e26a28-f40f-49f6-8451-d10717827599']" +gpt-5,code-from-image,5,"['c0203012-10f5-4e91-9ad3-268898886a47', '286557fb-b1c1-44b2-abec-1bdf121651e0', 'baa7b454-08dc-40a5-a261-6046202442db', 'c0d80f87-7f30-487a-b3e2-5766600f742f', 'fa04e5ef-1582-4f5a-a06f-13209cd53795']","['code-from-image__qw2EjPf', 'code-from-image__e8oZkAs', 'code-from-image__BTxQovg', 'code-from-image__CRqGAoW', 'code-from-image__iGqu8yh']",2,"[1201.63056, 1200.001344, 1220.118122, 567.152112, 428.287744]","[51.876972, 79.384996, 217.359113, 69.271324, 16.024637]",0.4,False,"['c0d80f87-7f30-487a-b3e2-5766600f742f', 'fa04e5ef-1582-4f5a-a06f-13209cd53795']" +gpt-5,configure-git-webserver,6,"['2273405c-10d4-475c-a5de-f1815d335cd3', 'c464dd5f-0dd3-40cc-83fc-4322351e787f', '68d1e3dc-8936-4ec9-88d4-b0d3c066bfba', '582e389d-1c75-407d-8a52-ec9f34d09591', '74f9a8c6-854a-44a0-8c29-7611d07b3080', '294b6bf2-112b-46fd-8f94-3d053acd45ca']","['configure-git-webserver__ELNYJ2w', 'configure-git-webserver__ZjDfk4P', 'configure-git-webserver__dLM7dci', 'configure-git-webserver__zv2wPqv', 'configure-git-webserver__i5fTqHJ', 'configure-git-webserver__dPq4uwF']",6,"[145.150595, 651.456662, 778.7174, 367.7218, 584.741749, 686.346796]","[12.73458, 35.166313, 65.213501, 38.197522, 152.630794, 38.309222]",1.0,True,"['2273405c-10d4-475c-a5de-f1815d335cd3', 'c464dd5f-0dd3-40cc-83fc-4322351e787f', '68d1e3dc-8936-4ec9-88d4-b0d3c066bfba', '582e389d-1c75-407d-8a52-ec9f34d09591', '74f9a8c6-854a-44a0-8c29-7611d07b3080', '294b6bf2-112b-46fd-8f94-3d053acd45ca']" +gpt-5,constraints-scheduling,7,"['e44839c0-6f4c-47c7-8fb6-1042c44f9ba7', '71797a23-2aa0-4128-b87e-65488427ac58', '9adf687d-9e4b-4a7b-a3e3-1a7cedb106ad', 
'41dcdcd6-a2ae-43ae-9714-8ad88799b586', 'cb6167f6-5a39-4e8d-8579-506414cb37be', '8cdf973c-ce6d-41a8-8b6e-f61b8a5607fd', '66137536-1a88-40ad-8f67-72d64ed280be']","['constraints-scheduling__xQt8HUg', 'constraints-scheduling__ykiFCV7', 'constraints-scheduling__gGdaud7', 'constraints-scheduling__PNaxhry', 'constraints-scheduling__5yNJ6qF', 'constraints-scheduling__9SFhx74', 'constraints-scheduling__5z32nEW']",6,"[181.470067, 268.954183, 330.293856, 265.556712, 192.297308, 174.712709, 153.199702]","[81.850921, 79.984534, 81.579746, 71.556551, 13.357087, 12.664549, 11.98099]",0.8571428571428571,True,"['e44839c0-6f4c-47c7-8fb6-1042c44f9ba7', '71797a23-2aa0-4128-b87e-65488427ac58', '9adf687d-9e4b-4a7b-a3e3-1a7cedb106ad', '41dcdcd6-a2ae-43ae-9714-8ad88799b586', 'cb6167f6-5a39-4e8d-8579-506414cb37be', '66137536-1a88-40ad-8f67-72d64ed280be']" +gpt-5,count-dataset-tokens,6,"['a9104fa7-3fa9-422d-8f9a-af735310996c', 'd60e7b89-5170-4140-8897-2d9462402455', 'cbcce4de-0ee3-47a5-a9d8-0bcf92ddb92c', '802a0ccf-7dc4-47cf-91c2-5ccd9713cfc3', 'f913d927-aada-47cc-b8b5-1a3bf9f0749b', '8cf391f8-1562-4c0b-9ff3-740f02aff742']","['count-dataset-tokens__SRW83kj', 'count-dataset-tokens__4Jw2KaZ', 'count-dataset-tokens__WCPRTky', 'count-dataset-tokens__2L8baVu', 'count-dataset-tokens__Ue4cuPx', 'count-dataset-tokens__Bd83wtD']",1,"[516.552996, 663.083849, 650.136885, 900.418506, 668.834334, 915.590993]","[8.839998, 32.308258, 12.280382, 14.137497, 37.829523, 53.689987]",0.16666666666666666,False,['d60e7b89-5170-4140-8897-2d9462402455'] +gpt-5,crack-7z-hash,7,"['afc2284e-c651-4b9f-9a9a-11e1a11c4ed2', '5fcef6f5-c931-40e1-bb3a-c1fff033da31', '095634db-b3bd-4bae-aab7-d37d2155318d', 'aa577c68-82a4-4e92-beaf-6cd39e73dd1b', 'fb4b0c44-d06d-4c8b-94af-ca6f8836f660', '89d03271-11f3-40b7-8652-7811c87c74f8', 'c8918de4-af8f-42c7-b859-7f6048451477']","['crack-7z-hash__mhF6k7R', 'crack-7z-hash__wBfvSNx', 'crack-7z-hash__j5dZr4T', 'crack-7z-hash__fq6QXSs', 'crack-7z-hash__VeDUHNp', 'crack-7z-hash__Q7C7LMJ', 
'crack-7z-hash__AeL5MfP']",3,"[544.140932, 140.127986, 735.296622, 693.078611, 900.001286, 868.820394, 56.775652]","[19.363334, 12.699971, 26.174252, 8.747214, 14.544173, 29.537457, 20.340346]",0.42857142857142855,False,"['afc2284e-c651-4b9f-9a9a-11e1a11c4ed2', '095634db-b3bd-4bae-aab7-d37d2155318d', '89d03271-11f3-40b7-8652-7811c87c74f8']" +gpt-5,db-wal-recovery,7,"['264f3b92-533b-43c2-af22-c2b5891928b6', '976bea3b-4536-4fcc-9723-2fc0d1cfd50b', '91e7e2f5-9bff-4120-b8ad-287df4753714', 'a3c98cf9-d56b-4fbc-9a8c-a8cfdb840c44', '95282df7-782c-4cd6-9a92-0a73ba18dd4b', 'dbba3f65-b266-4c37-aa6f-b6c915c8b4da', '0193f7f3-563d-4ca1-a35a-4b48ccbbe905']","['db-wal-recovery__iBH2rwU', 'db-wal-recovery__gMpG67a', 'db-wal-recovery__WMKsy8r', 'db-wal-recovery__C9TLdkn', 'db-wal-recovery__Bs9rBLQ', 'db-wal-recovery__q24a9Xj', 'db-wal-recovery__kajS8jd']",1,"[585.510196, 924.188288, 903.651288, 900.001769, 124.038376, 1014.428489, 915.504961]","[26.961274, 16.997902, 26.4765, 11.233638, 8.869277, 64.919731, 89.638595]",0.14285714285714285,False,['95282df7-782c-4cd6-9a92-0a73ba18dd4b'] +gpt-5,distribution-search,7,"['da36dc85-145e-40a8-aa8c-ca018763c3e4', '956f5e49-1099-4023-8aab-2b12bcf0a7d6', '3ceb6ac7-016e-4a9c-8d7e-f0fe68778ed2', '14e4c0e1-444e-49ef-8c94-0fca269d1437', '74226433-2b61-499f-9c66-61467bf2b2a1', '6e98b0d7-c3a4-4e48-9b46-c304e7f92aab', 'e759cfc1-86cb-4398-b354-11a6460c0214']","['distribution-search__hsdkztG', 'distribution-search__sEdSpKf', 'distribution-search__DzbWEgd', 'distribution-search__WQJoEa7', 'distribution-search__oSBNq2G', 'distribution-search__3n2jCgR', 'distribution-search__6DT4PtW']",7,"[327.497215, 272.605554, 148.571519, 608.0784, 255.047714, 450.929963, 148.92117]","[146.049372, 50.107973, 10.915835, 23.590333, 38.522244, 156.406897, 19.435894]",1.0,True,"['da36dc85-145e-40a8-aa8c-ca018763c3e4', '956f5e49-1099-4023-8aab-2b12bcf0a7d6', '3ceb6ac7-016e-4a9c-8d7e-f0fe68778ed2', '14e4c0e1-444e-49ef-8c94-0fca269d1437', 
'74226433-2b61-499f-9c66-61467bf2b2a1', '6e98b0d7-c3a4-4e48-9b46-c304e7f92aab', 'e759cfc1-86cb-4398-b354-11a6460c0214']" +gpt-5,dna-assembly,6,"['c4add67a-b81a-4dfa-a5e3-df08871b753d', 'eeb76996-1338-424c-9268-c8280da62777', '951447fb-2065-4e01-9858-d6ca408ff24f', 'd65c207d-655b-4b0b-a5db-bc54a871abc4', '6da7c904-8450-4224-b003-a73b3106c338', 'fc1d4edc-8bc6-4ce9-bfa4-9f090bc483af']","['dna-assembly__PYg9Soc', 'dna-assembly__X5uojvJ', 'dna-assembly__rg5PieE', 'dna-assembly__wAiSZJV', 'dna-assembly__Np2YV2p', 'dna-assembly__H9EgxsM']",0,"[666.00144, 777.441933, 724.760434, 720.031722, 750.654915, 747.223056]","[31.858785, 67.292686, 129.787704, 52.008669, 37.118579, 25.142205]",0.0,False,[] +gpt-5,dna-insert,6,"['1c80dd90-f60e-4da4-b241-9f2f60812750', 'a1a72053-dd64-4a8d-a0b9-183457c38182', '80ee59a5-1ed4-4853-825d-9067fad0e72d', 'eb17ff62-d0fd-49e6-820a-4a012b4ef4f2', '0df821ee-96c3-4a3d-9f11-d69aadecfbaf', '6dcc6a9f-9fdb-4505-a2a5-43521bfcbd9d']","['dna-insert__7d89WqV', 'dna-insert__xaRvSUF', 'dna-insert__68S4FDE', 'dna-insert__oLyKirk', 'dna-insert__5Nzq2hh', 'dna-insert__vVzfP67']",0,"[470.679608, 380.107128, 360.010782, 360.001225, 362.328948, 360.425853]","[35.795519, 30.062659, 38.555212, 17.437189, 48.380588, 73.406927]",0.0,False,[] +gpt-5,extract-elf,7,"['ec41e45d-2ebc-4705-b687-3d358466633d', 'ea916cad-d7d6-4e4c-9c65-695480f82964', 'a4c88d8d-cd05-4789-b7c9-bbb8c134b2a8', 'd09e362d-8bac-4f15-8c38-aea6f8bb3d68', '0c394b1a-a690-49f9-be61-cf37e6087d29', 'e28002c8-4c83-49a5-babc-4fad55afb951', '2103b800-0976-4145-8b02-6801e43d6ff5']","['extract-elf__Ttz9Kf8', 'extract-elf__jeCHzer', 'extract-elf__WqeazPk', 'extract-elf__F8GYgmM', 'extract-elf__dMgFRdS', 'extract-elf__E559k8j', 'extract-elf__YopgJgj']",2,"[189.579897, 216.97055, 558.509989, 114.179744, 303.231561, 198.657689, 105.844648]","[26.858638, 50.444566, 100.095715, 13.9943, 49.321635, 24.252616, 9.780107]",0.2857142857142857,False,"['ec41e45d-2ebc-4705-b687-3d358466633d', 
'e28002c8-4c83-49a5-babc-4fad55afb951']" +gpt-5,feal-differential-cryptanalysis,5,"['8fba36f8-264b-48fa-b22c-5b693fe44c36', '452415ac-4965-4f39-998d-57cbbcc24b55', '91f654ec-4ff6-4ed0-9ae9-5ce504a14ad7', 'f7be1a8a-e68e-45d6-a540-1c50e2a391a1', 'dfbb884a-fa7f-416a-8531-27b400316d35']","['feal-differential-cryptanalysis__pKYjguW', 'feal-differential-cryptanalysis__9kKRvGV', 'feal-differential-cryptanalysis__fqQKfxK', 'feal-differential-cryptanalysis__gAxfWDY', 'feal-differential-cryptanalysis__chSpLHL']",0,"[527.229762, 460.952586, 523.144905, 982.667163, 428.680043]","[41.227842, 91.546101, 313.048167, 10.944871, 340.604771]",0.0,False,[] +gpt-5,feal-linear-cryptanalysis,7,"['b5e69394-6dd8-42d4-b61c-b943337d39c3', 'f913c078-a29f-4c0a-a0b5-0592cd51c8dd', '661c1ce4-03fd-4b3c-b569-a8214bb66519', '07d56ad8-ccef-4c2a-b468-80ee37717f98', '5fc4268a-d7fe-45d6-b59f-9cc28513dfc8', 'ae33265f-fab8-4850-abdf-1cfcd7174cfc', 'f7ddca7a-26e0-497c-acd3-929095841245']","['feal-linear-cryptanalysis__hUowkYQ', 'feal-linear-cryptanalysis__vQ4MH3V', 'feal-linear-cryptanalysis__YKKmnKP', 'feal-linear-cryptanalysis__SDWG4qw', 'feal-linear-cryptanalysis__qgssPkK', 'feal-linear-cryptanalysis__yY4whSJ', 'feal-linear-cryptanalysis__QN5jdcd']",7,"[908.290389, 656.289345, 1413.234163, 860.564152, 345.592296, 1599.371244, 887.480821]","[31.402331, 91.111483, 30.340901, 29.831587, 20.12171, 8.993617, 93.379735]",1.0,True,"['b5e69394-6dd8-42d4-b61c-b943337d39c3', 'f913c078-a29f-4c0a-a0b5-0592cd51c8dd', '661c1ce4-03fd-4b3c-b569-a8214bb66519', '07d56ad8-ccef-4c2a-b468-80ee37717f98', '5fc4268a-d7fe-45d6-b59f-9cc28513dfc8', 'ae33265f-fab8-4850-abdf-1cfcd7174cfc', 'f7ddca7a-26e0-497c-acd3-929095841245']" +gpt-5,filter-js-from-html,7,"['a3a35965-dc8f-4b86-ad1d-f79f00896bf8', '716eaecb-5fcf-4eb8-b9db-12cab2900664', '9abfad31-2161-46bb-9453-2d7059b2f9fd', '79c59929-1b11-4122-b5ea-d3564eba9bfa', '472a6762-ce4b-493d-bc5a-b0c35d9be076', '81384866-4394-4f78-a506-af497faf7496', 
'47a91cbb-d396-4a7f-afed-8bdfb316a431']","['filter-js-from-html__p96u6zz', 'filter-js-from-html__ed6p5qN', 'filter-js-from-html__wdU52UJ', 'filter-js-from-html__9HSuuXr', 'filter-js-from-html__JY672a2', 'filter-js-from-html__HHg43k3', 'filter-js-from-html__xHAqJSY']",0,"[361.536895, 246.87478, 513.369315, 190.504802, 390.710676, 296.645272, 124.138036]","[44.903613, 30.142108, 43.977028, 82.796899, 53.885869, 172.710727, 7.050967]",0.0,False,[] +gpt-5,financial-document-processor,6,"['0c90ba40-dfcb-49c4-8df6-644da427922f', '7a11441a-7a42-44d6-97b0-6b5bf8945f57', 'bf8b3f74-df47-4f3e-bcf5-1e83ab1abda5', 'fdd88afb-f22c-4dc6-9172-7c41dc25da59', '619cec56-9023-4590-92ee-2bc921101657', '27b29555-6dcf-4ae2-bf78-a4001bd1e92a']","['financial-document-processor__pd2zske', 'financial-document-processor__rjL4CDq', 'financial-document-processor__X4VEJyf', 'financial-document-processor__rzeAtHy', 'financial-document-processor__7khixGo', 'financial-document-processor__RN32gB8']",0,"[527.003723, 465.008393, 1259.580442, 955.653402, 609.575185, 457.32104]","[97.170713, 16.516862, 261.820097, 25.552764, 44.435925, 319.761173]",0.0,False,[] +gpt-5,fix-code-vulnerability,6,"['2ecbb0d2-527c-416d-80a3-a40bb6710cf5', '1bb86b23-70b7-4ded-92b8-42089a80a6c2', '10f2c158-abc1-4e84-9853-df0361ebd3ca', '6817506c-b19f-43fe-8762-be6d6931f15b', 'f7c6c392-41af-4392-a12c-23bbd3d24558', '8b3a085b-2cbb-4ca2-b074-f1b6685c76f8']","['fix-code-vulnerability__WXJ3nJF', 'fix-code-vulnerability__FBtyK5s', 'fix-code-vulnerability__CmGuh85', 'fix-code-vulnerability__Yf4EDQn', 'fix-code-vulnerability__mJmgMrD', 'fix-code-vulnerability__BGNmhnj']",0,"[902.279823, 902.000882, 911.885947, 901.991962, 900.000675, 1018.416899]","[85.506013, 73.749774, 41.424209, 4.653671, 2.180543, 11.397228]",0.0,False,[] +gpt-5,fix-git,7,"['fa2775ea-3e28-4a68-ba8b-6e0ef3ac5d87', '9573e490-64f2-499d-b7ed-c24a03122753', '80a0e56c-96ba-4eb9-b8f5-6c48ea4814bc', 'e3b9b919-ff1e-41ed-9cec-c249ff18ac4e', 
'771c770a-515c-4d1a-aa52-fc23621d9917', '0c53e65c-912b-478a-bd1f-fa4d78f3719b', 'e3bc1daf-d874-47c4-977d-9afc42706345']","['fix-git__RsK7cpN', 'fix-git__JbXBm2b', 'fix-git__LA7v2BC', 'fix-git__SRFeQkX', 'fix-git__GvnUoWK', 'fix-git__zVxMYKB', 'fix-git__iXekWB9']",7,"[435.026853, 267.159951, 110.055566, 268.257141, 152.242485, 137.151731, 138.027554]","[52.330139, 67.471635, 10.306406, 41.614713, 8.230076, 86.298567, 32.382884]",1.0,True,"['fa2775ea-3e28-4a68-ba8b-6e0ef3ac5d87', '9573e490-64f2-499d-b7ed-c24a03122753', '80a0e56c-96ba-4eb9-b8f5-6c48ea4814bc', 'e3b9b919-ff1e-41ed-9cec-c249ff18ac4e', '771c770a-515c-4d1a-aa52-fc23621d9917', '0c53e65c-912b-478a-bd1f-fa4d78f3719b', 'e3bc1daf-d874-47c4-977d-9afc42706345']" +gpt-5,fix-ocaml-gc,6,"['6d78f7f4-c47b-4ef8-bd35-af7adb9617fe', 'bbbac5dd-e18f-4881-9561-68e14c072e9c', 'ba67c269-687a-4dc4-9de7-906e447f9713', '507be476-27a6-4de9-822b-72a86043bdcd', '2ffd3819-f3cc-41e8-8090-851fceb5b36d', '1d6a1188-f00f-4522-a9c4-db252d7759b3']","['fix-ocaml-gc__EoN8hf2', 'fix-ocaml-gc__4PBcQoP', 'fix-ocaml-gc__VWqoAAv', 'fix-ocaml-gc__whhd332', 'fix-ocaml-gc__KQXNwkK', 'fix-ocaml-gc__q94MPyH']",0,"[3604.829114, 3600.019834, 3627.691823, 3607.458276, 3600.790072, 3600.002266]","[60.569386, 81.880765, 48.135116, 67.85194, 243.452406, 13.970946]",0.0,False,[] +gpt-5,form-filling,5,"['2a260166-61f0-4fce-b463-4ff9e962dfc6', '4eb85de0-9c15-4f90-9c4b-8ba3a150dca7', '9718e6fe-22ba-4edd-87e3-ef73453b249e', '5a7417fe-a88b-42d5-b6a5-7b01d32763c6', '7f2a3c75-8849-4a30-85e1-4f2b58c10622']","['form-filling__DiDzcSK', 'form-filling__NCg3eF4', 'form-filling__i6o5pim', 'form-filling__grkwgEz', 'form-filling__igJY4Fq']",4,"[568.057126, 541.252707, 905.86045, 665.346979, 579.442688]","[59.973684, 9.919524, 6.931635, 9.323126, 14.244631]",0.8,True,"['2a260166-61f0-4fce-b463-4ff9e962dfc6', '4eb85de0-9c15-4f90-9c4b-8ba3a150dca7', '5a7417fe-a88b-42d5-b6a5-7b01d32763c6', '7f2a3c75-8849-4a30-85e1-4f2b58c10622']" 
+gpt-5,git-leak-recovery,7,"['1d01d2fa-42fd-4fc5-b808-38af1c5778c0', 'a68fb259-b4ef-4aca-ae0c-4907817dd7d3', '5f5500ce-d56c-42ec-8114-7abb5398645c', 'ad13e37e-e085-4132-bbc2-427204da9faa', '021d5735-c51b-41ac-aa15-5f8f320f0b52', 'd60b7f97-eb79-4057-8ca9-9abe9b9db591', 'f12084c2-0ae4-4b65-8270-751f35512c80']","['git-leak-recovery__w6gTD4y', 'git-leak-recovery__EHcjnav', 'git-leak-recovery__TsToFWG', 'git-leak-recovery__5WHh6Yr', 'git-leak-recovery__BfY5m9T', 'git-leak-recovery__weByehk', 'git-leak-recovery__eUPWpRf']",5,"[280.969164, 293.401903, 901.331757, 208.594188, 900.001982, 109.092514, 87.398418]","[56.846194, 68.145412, 23.102632, 42.106323, 27.247811, 21.38778, 16.358533]",0.7142857142857143,True,"['1d01d2fa-42fd-4fc5-b808-38af1c5778c0', 'a68fb259-b4ef-4aca-ae0c-4907817dd7d3', 'ad13e37e-e085-4132-bbc2-427204da9faa', 'd60b7f97-eb79-4057-8ca9-9abe9b9db591', 'f12084c2-0ae4-4b65-8270-751f35512c80']" +gpt-5,gpt2-codegolf,5,"['92461c80-eb60-482c-bb55-2bcc11051e5d', '0c28f9c0-dec1-4d7b-a172-f819173a3ceb', 'ba624593-febe-42ae-a91f-334a70e333ca', '59c76845-2ee2-4c71-8fc1-8fbbc5eeb900', 'd2954d13-0729-4b1b-b746-c5e04668ebbe']","['gpt2-codegolf__cZF7cSA', 'gpt2-codegolf__8ZUHRDU', 'gpt2-codegolf__xHdkVbv', 'gpt2-codegolf__77oXroZ', 'gpt2-codegolf__q6Em9pb']",0,"[900.014797, 795.122958, 990.828439, 909.627104, 906.57832]","[238.873664, 114.2696, 65.765675, 15.769505, 38.027421]",0.0,False,[] +gpt-5,hf-model-inference,6,"['c935f7f6-6819-4116-a924-6ff5558d5ee0', '034010f8-5d38-4119-b596-c4a1e25a8cc6', 'b120f3bf-a8ca-4024-9e62-64e5d9e28946', 'ec5caf4f-3214-49ad-a838-4bcda768beb0', 'b85e18c9-f2b9-4a47-a3b9-b3f50ae506ff', '2066effb-4566-4842-b5a4-fd59b2d34d01']","['hf-model-inference__gxBhQfN', 'hf-model-inference__4dKxrHw', 'hf-model-inference__LeYF65q', 'hf-model-inference__9hgKi2D', 'hf-model-inference__3CtqyMc', 'hf-model-inference__nXWYSav']",6,"[170.313113, 304.240438, 312.829563, 385.184219, 643.153518, 441.130385]","[9.021081, 79.634151, 32.20607, 38.27839, 
77.146419, 24.983522]",1.0,True,"['c935f7f6-6819-4116-a924-6ff5558d5ee0', '034010f8-5d38-4119-b596-c4a1e25a8cc6', 'b120f3bf-a8ca-4024-9e62-64e5d9e28946', 'ec5caf4f-3214-49ad-a838-4bcda768beb0', 'b85e18c9-f2b9-4a47-a3b9-b3f50ae506ff', '2066effb-4566-4842-b5a4-fd59b2d34d01']" +gpt-5,install-klee-minimal,6,"['a3063373-c247-457e-a89d-3a401eec3143', 'f1755a39-6fc2-48d5-83db-ee773c79f222', 'e27c1749-6550-41a1-8151-1e6ed40f2243', 'd0a47b4a-6eff-422f-ad93-b6a7a215b0e7', '149e1f1d-29c5-4b3b-b165-6f22abc80bc5', '3d875769-e80b-4552-8b32-ad26630e8cb0']","['install-klee-minimal__8yXFBKf', 'install-klee-minimal__mrfqK5f', 'install-klee-minimal__2UPy3Gy', 'install-klee-minimal__8Jkt2bJ', 'install-klee-minimal__8joiRDc', 'install-klee-minimal__uhkFdo8']",0,"[900.007161, 900.000697, 901.908794, 900.064479, 900.153186, 900.057718]","[12.072201, 222.288946, 34.553265, 79.024892, 59.835953, 76.187057]",0.0,False,[] +gpt-5,install-windows-3.11,5,"['09331612-af95-462e-9ac8-84f8401c065b', 'b0adb040-ac27-4b1c-bb74-26ab77a88328', 'b2f19a2d-2518-4456-8333-b4046c3d407c', 'ed7cd3da-e642-4230-85b9-b4aa1476f314', 'dea1b982-98d8-4ad7-87b9-56a13f6dfb08']","['install-windows-3.11__HHiBZVT', 'install-windows-3.11__Km6eD3s', 'install-windows-3.11__osxJ2Xc', 'install-windows-3.11__LtcMcTZ', 'install-windows-3.11__BhYUhfJ']",0,"[290.538304, 1094.848031, 259.88754, 467.275171, 227.360665]","[62.711546, 17.495974, 22.801317, 37.238749, 42.342651]",0.0,False,[] +gpt-5,large-scale-text-editing,7,"['568fdf21-3941-49db-b68c-3196a84d4a05', '38448196-935c-445d-ab11-3e4b713f8da0', 'c3ed9aa9-f28c-4821-a5f0-60a121704ce1', 'bb812fde-9294-4228-9db7-fa72b3b96fde', '44b5a656-d655-4031-8d57-c5e7afb47324', 'fec4817a-e77d-44b2-b74b-d9ae33b124a4', '043b8d8f-829a-4edd-b60a-5749ba6f787e']","['large-scale-text-editing__hCPsZmh', 'large-scale-text-editing__A2dtxLC', 'large-scale-text-editing__uePXC23', 'large-scale-text-editing__uNbhV8q', 'large-scale-text-editing__tJSDiEs', 'large-scale-text-editing__kzZ9Woe', 
'large-scale-text-editing__CrmeGUd']",3,"[164.122586, 1241.365031, 370.535239, 1205.311247, 908.91406, 148.21879, 488.383421]","[12.328154, 11.732307, 24.976196, 252.624553, 25.155767, 11.049099, 98.149022]",0.42857142857142855,False,"['568fdf21-3941-49db-b68c-3196a84d4a05', 'c3ed9aa9-f28c-4821-a5f0-60a121704ce1', 'fec4817a-e77d-44b2-b74b-d9ae33b124a4']" +gpt-5,largest-eigenval,5,"['e037d264-15df-4063-90eb-a7a3e4749ac1', 'b5e793d0-8715-420f-a90b-a7c1cf8cec6a', '1441cf57-e3c0-4c64-8093-b9fbf698a10b', '362279f4-044f-4901-89ba-2da02544265a', 'ee1c0775-dcae-4cba-af17-351ab32299c4']","['largest-eigenval__BhmXzK2', 'largest-eigenval__ZENJoDv', 'largest-eigenval__YbzbFRV', 'largest-eigenval__in2EAEL', 'largest-eigenval__57dxn37']",0,"[915.411873, 725.332873, 900.088639, 913.914877, 906.5192]","[46.361913, 32.590278, 200.034603, 70.762171, 155.115216]",0.0,False,[] +gpt-5,log-summary-date-ranges,7,"['c6eba79c-375a-4a82-b0d0-2e34e1e30e1f', '8863cd87-0e4c-464e-b33e-c2fe56704274', 'bee2c417-be6a-4319-a1e1-3895a2989929', '68797e4d-8a6a-4d44-a779-a4ae5dc9e94c', '1d797159-d8ee-4ff3-907b-82bdc431a0d4', 'c2f65f40-7989-4c11-b809-9bd92f8e882e', 'b1329b7c-a036-496d-aa49-f73af5b23cce']","['log-summary-date-ranges__nyiArf6', 'log-summary-date-ranges__QzhKufJ', 'log-summary-date-ranges__SscWDtQ', 'log-summary-date-ranges__SvJ7xnC', 'log-summary-date-ranges__53ozNLs', 'log-summary-date-ranges__rsdtXRT', 'log-summary-date-ranges__HXoMTWs']",0,"[203.376941, 109.220249, 141.897095, 111.243658, 273.448434, 140.757486, 56.137735]","[135.024381, 23.906896, 9.005348, 31.931698, 162.043262, 22.38043, 22.023146]",0.0,False,[] +gpt-5,make-doom-for-mips,7,"['fb19a7eb-c94a-4961-9628-b9095bb41d22', 'f83541b9-5792-4a60-a39a-b34d5941031c', 'b87d4f01-67da-404e-a6b1-cd464ef4e8fb', '1e21f7c9-b966-4bd0-b874-3775bddaf2b1', 'a108b9a0-292e-4e37-8760-48a66deff06d', '59e6fd84-ac60-4260-b93e-6425f778a558', 'f931da19-2f56-4f8e-8f56-dc173a1ddd4a']","['make-doom-for-mips__FQyJYmV', 'make-doom-for-mips__p72S3Cg', 
'make-doom-for-mips__vjurx59', 'make-doom-for-mips__F6g95sN', 'make-doom-for-mips__pVxSq8h', 'make-doom-for-mips__A5QdUcA', 'make-doom-for-mips__ybAzQGJ']",0,"[900.011283, 902.386841, 900.033643, 900.002286, 906.463231, 900.659976, 900.000973]","[226.151447, 13.10828, 51.757343, 8.129091, 38.250339, 48.043722, 9.074462]",0.0,False,[] +gpt-5,make-mips-interpreter,6,"['ece24654-de34-4d17-8f2b-105a75802be4', '899c39df-0934-409f-bef2-82c3a3f6cf5d', '6bafa982-1d1f-4c1d-8a4a-69a934c4bd71', 'bc7ef71c-06b2-48df-9499-f36a9d76e93b', 'c8fe452a-3a6a-45ee-a35f-df55603648f5', 'fe991bdd-e5a8-4979-aefb-ae37e97f08eb']","['make-mips-interpreter__SfzDtzX', 'make-mips-interpreter__vXnYzSz', 'make-mips-interpreter__iy6yTt7', 'make-mips-interpreter__uhWnmbL', 'make-mips-interpreter__d4UvDkb', 'make-mips-interpreter__hh9QeWi']",0,"[1820.739403, 1800.00051, 1809.734291, 1800.206438, 1801.337443, 1800.001333]","[20.95528, 31.32004, 197.156812, 56.767664, 31.205366, 6.011888]",0.0,False,[] +gpt-5,merge-diff-arc-agi-task,7,"['36b00af7-a0f8-49c5-993d-b1a1fd35beb0', '985d75a0-5a87-4fa4-a136-910a8413bb30', '8ffd3460-8727-4288-8c4c-f07d37e44734', 'f1f8230d-cf05-4c87-b67a-b9ffe6236233', 'c1c5b36c-b26f-40fa-9537-95af9172895a', '9e91ce44-e2b8-48cf-9824-c0284b67194a', '7882256a-af1c-4a07-a2c2-7af24d13189f']","['merge-diff-arc-agi-task__2VPBZpL', 'merge-diff-arc-agi-task__YAsZgbj', 'merge-diff-arc-agi-task__4PJEDah', 'merge-diff-arc-agi-task__dogE589', 'merge-diff-arc-agi-task__MNkbUJe', 'merge-diff-arc-agi-task__HfmWCse', 'merge-diff-arc-agi-task__2FyoVfJ']",7,"[254.343024, 524.795835, 755.773528, 502.368781, 443.221105, 412.923203, 552.292243]","[20.142096, 14.858028, 17.283049, 19.244743, 17.129905, 30.526098, 15.646848]",1.0,True,"['36b00af7-a0f8-49c5-993d-b1a1fd35beb0', '985d75a0-5a87-4fa4-a136-910a8413bb30', '8ffd3460-8727-4288-8c4c-f07d37e44734', 'f1f8230d-cf05-4c87-b67a-b9ffe6236233', 'c1c5b36c-b26f-40fa-9537-95af9172895a', '9e91ce44-e2b8-48cf-9824-c0284b67194a', 
'7882256a-af1c-4a07-a2c2-7af24d13189f']" +gpt-5,model-extraction-relu-logits,6,"['7cfa567b-4e73-46e0-b0e2-837968b4c4ac', 'ece7e9bc-7f65-4019-8991-e8c7a22a0796', '7ddc7bbe-58aa-472c-a4ec-ee7e06259bbc', '19d78783-7ac0-43f9-8e60-146d6c189d7e', 'c5ca9c96-de52-4df6-8361-616a2058f7a0', '9868a0db-11cd-4002-86ba-816516162219']","['model-extraction-relu-logits__d9eQFdt', 'model-extraction-relu-logits__QQB3JBq', 'model-extraction-relu-logits__SmvYPDB', 'model-extraction-relu-logits__udGz9sZ', 'model-extraction-relu-logits__6MiMiW5', 'model-extraction-relu-logits__3D5jzpT']",1,"[292.679044, 96.777411, 137.309111, 495.980032, 316.262251, 777.806328]","[8.948005, 31.03131, 20.911405, 72.226962, 9.471818, 103.613313]",0.16666666666666666,False,['7ddc7bbe-58aa-472c-a4ec-ee7e06259bbc'] +gpt-5,mteb-leaderboard,5,"['05ff8ea1-61c4-4641-b55e-aa6c64e64095', 'bc534b5c-5edc-4565-a997-d1064d098903', '84465b91-466d-4629-90fc-96ac86b42d19', '4e02c6f8-3e1e-487e-a557-7a164bf22323', '58dd69a3-14f0-4311-9466-25351a5871e1']","['mteb-leaderboard__GwnUnD7', 'mteb-leaderboard__UMAwg8P', 'mteb-leaderboard__qakxoVK', 'mteb-leaderboard__hiia5TW', 'mteb-leaderboard__8TqzbW9']",0,"[1002.181577, 2711.199834, 765.773785, 965.411028, 3193.466254]","[5.132226, 38.918911, 3.296357, 117.126333, 4.042383]",0.0,False,[] +gpt-5,mteb-retrieve,6,"['26bf9181-ac63-4d87-b8bf-acecea5eb090', '574c6244-981c-4f31-8029-f42e33a8f24c', '2ef28364-d183-4268-bc32-6ed4c27ffc21', '867ebf83-d157-4139-b30e-b983d7fb42e6', '269e2288-f545-497e-98a6-318d1b2a1cfb', 'bf0a7563-be09-460b-b693-c4d97dc2de75']","['mteb-retrieve__5hp3yu8', 'mteb-retrieve__gPZdGRG', 'mteb-retrieve__VHpBTDP', 'mteb-retrieve__FjFwoK4', 'mteb-retrieve__qVW7kAn', 'mteb-retrieve__XFMkR53']",0,"[315.698627, 276.970491, 187.925343, 118.223015, 316.201927, 215.725581]","[36.741265, 137.869488, 24.858108, 8.807723, 3.528326, 2.099594]",0.0,False,[] +gpt-5,nginx-request-logging,6,"['e903a8f8-0616-4a61-8bcd-e9b1243ead70', 'b6271fa9-0d5f-4238-84a7-888844ca4a1f', 
'1091c897-9654-4089-9768-38fc36b93809', '1fd89e02-aeb6-4c55-b52c-159ec614e3ef', '6b3efbe6-cfe3-4ad1-a0cf-d2c822395dae', 'f1899341-b1ba-4c56-b669-3b3a8450598f']","['nginx-request-logging__zTka35c', 'nginx-request-logging__EtFEV5c', 'nginx-request-logging__svSyVSM', 'nginx-request-logging__eGhEtzM', 'nginx-request-logging__Cb2ZuCZ', 'nginx-request-logging__NZnALLi']",6,"[287.752694, 180.570738, 197.444026, 504.06337, 193.951082, 148.27305]","[43.3071, 9.029903, 49.687537, 18.746825, 28.497858, 34.498012]",1.0,True,"['e903a8f8-0616-4a61-8bcd-e9b1243ead70', 'b6271fa9-0d5f-4238-84a7-888844ca4a1f', '1091c897-9654-4089-9768-38fc36b93809', '1fd89e02-aeb6-4c55-b52c-159ec614e3ef', '6b3efbe6-cfe3-4ad1-a0cf-d2c822395dae', 'f1899341-b1ba-4c56-b669-3b3a8450598f']" +gpt-5,openssl-selfsigned-cert,6,"['7651f3ee-ab0d-433f-8810-8305f3535ac8', '2f1bded6-3414-4bbc-af0c-4b827ae50b49', '71586f18-147f-4470-af96-cd90279d7797', 'd6ee15ac-03ea-4629-b73d-e7bc053282c9', '5a60ec64-138d-4db9-baaf-0ea2af61f9b3', '9dcfb3ed-3277-4faa-9b83-785e1ea23455']","['openssl-selfsigned-cert__V2piWiC', 'openssl-selfsigned-cert__rsMAauT', 'openssl-selfsigned-cert__7BsSHqe', 'openssl-selfsigned-cert__3pEsLVL', 'openssl-selfsigned-cert__VUuWwu3', 'openssl-selfsigned-cert__sbKNXcL']",6,"[111.747008, 134.891475, 161.294279, 94.043205, 121.959776, 124.957272]","[13.125941, 118.336448, 22.875472, 76.484224, 1522.549006, 8.908719]",1.0,True,"['7651f3ee-ab0d-433f-8810-8305f3535ac8', '2f1bded6-3414-4bbc-af0c-4b827ae50b49', '71586f18-147f-4470-af96-cd90279d7797', 'd6ee15ac-03ea-4629-b73d-e7bc053282c9', '5a60ec64-138d-4db9-baaf-0ea2af61f9b3', '9dcfb3ed-3277-4faa-9b83-785e1ea23455']" +gpt-5,password-recovery,7,"['1ebdd63c-1eaa-495d-9f3a-1db36cea5b62', 'b05e161c-a86d-4936-ab9c-6ba23a95fe79', '952cc713-1d2f-4139-bea0-8b94b5d99e77', '87e81dc7-3412-4fa2-aeaf-24262ad9255a', 'cab09fd3-8155-49eb-8a7c-415df5bb7f3c', '94ae7aa9-63c3-4d89-a617-e7f579f290d9', '3e8237d5-c0a5-468e-a9c9-c31bd18b6cc6']","['password-recovery__H7gWExV', 
'password-recovery__5ANuugU', 'password-recovery__k2sn4cr', 'password-recovery__RogXs9s', 'password-recovery__MPKGLza', 'password-recovery__SLiDY5H', 'password-recovery__zjfWKQz']",0,"[907.806038, 901.586461, 900.702539, 900.001847, 900.427213, 1549.838791, 900.329749]","[16.873778, 13.555377, 42.355092, 12.559203, 38.486535, 160.667795, 23.384541]",0.0,False,[] +gpt-5,path-tracing,6,"['f4a58f67-209f-491e-9390-6e8faaed0192', '68b616a2-5897-4f6a-8e3e-779f95e1bcc8', 'd34bf7d6-1b8c-45c3-bc20-41884ae6f456', '274d8dd5-1bcf-4e85-9a23-e960479a9d73', 'c95796cc-2261-42ee-a40d-583910b10742', 'e3b87aaa-7450-4898-9284-cc3736de5902']","['path-tracing__VcNpQaR', 'path-tracing__xHoSiVi', 'path-tracing__oiNifJJ', 'path-tracing__RSK4UHi', 'path-tracing__Jcj2AAA', 'path-tracing__pREyFNo']",0,"[6611.720919, 1800.009502, 1854.889349, 1802.085791, 1056.51882, 1752.015862]","[40.862321, 10.414413, 7.626756, 36.517281, 88.3262, 86.40628]",0.0,False,[] +gpt-5,path-tracing-reverse,7,"['f3f3304f-7e65-4bfd-8f58-cf6c88a4e9f0', '11011d35-bc84-4e16-8968-39f29c8348e1', 'f8061f3b-ea90-4563-99ec-cfffe1e2ecbb', 'c68de3c6-c698-4e36-8317-9be7d35d104b', 'feac42a9-c1b0-4606-a946-91a8c1903182', 'e2cc54f9-880a-4947-a064-0813b8257e89', 'f200fe6d-e561-4b0e-9776-795ea77562b7']","['path-tracing-reverse__Ngr43zP', 'path-tracing-reverse__ofSGKDK', 'path-tracing-reverse__M5yXGbW', 'path-tracing-reverse__2dQyLZ9', 'path-tracing-reverse__5PzeDhB', 'path-tracing-reverse__fHzEcQC', 'path-tracing-reverse__bEzqY4B']",0,"[852.630629, 440.426682, 1860.210053, 1800.000693, 733.933442, 1019.723959, 1800.005368]","[74.109825, 77.45175, 44.98426, 16.36787, 16.033242, 141.017426, 10.217642]",0.0,False,[] +gpt-5,polyglot-c-py,6,"['2b10c226-9066-4427-9cba-04d42132dc88', 'ea8b6f01-a531-4a8f-96ba-24eaa49ef8ab', '1150d6b4-3ff6-45d9-af5a-c148d2306177', '4d8de6e7-5262-4ea5-8498-ef980d13e314', 'df04bd56-91b2-4f37-9997-3a6974ca55a5', '83c5abf6-350b-4f37-9a8e-7f16bbde3d10']","['polyglot-c-py__xKgdCnP', 'polyglot-c-py__cvA76Zc', 
'polyglot-c-py__DDmjwfC', 'polyglot-c-py__bV6fFWF', 'polyglot-c-py__NeJEXAw', 'polyglot-c-py__2B3uefv']",0,"[281.662106, 663.855689, 145.604507, 215.933267, 812.535531, 257.753256]","[14.615036, 16.38993, 16.010054, 19.485151, 34.565562, 21.317161]",0.0,False,[] +gpt-5,polyglot-rust-c,6,"['170f4cfc-67c0-4bae-b338-b454fa9c9dd0', 'e5c89fd6-b828-4922-958c-6445b54e0699', '5b89640d-4b7e-4772-b805-39d81caa017e', '965c1989-f3ea-442d-84dc-ef826bf10709', '423786cc-527b-4470-9401-4ea11ad5623e', '7e11a645-31b9-4cff-915c-405d5ea398a6']","['polyglot-rust-c__WQ2ZAZm', 'polyglot-rust-c__wAeA6vC', 'polyglot-rust-c__j5PCTYM', 'polyglot-rust-c__JGd6BBV', 'polyglot-rust-c__QgWtDKr', 'polyglot-rust-c__X3xVTg6']",0,"[921.104387, 938.261047, 900.007167, 900.113803, 900.436422, 902.240164]","[78.347823, 158.751408, 17.772359, 23.416558, 129.365199, 46.037392]",0.0,False,[] +gpt-5,port-compressor,4,"['21af24ea-410b-4846-98cc-d6e5258f1c09', 'c937d52b-1a16-47af-8f78-8969f2a22df9', '87b22db2-265d-45f7-b9f4-223e7a92e3cc', '50965709-97d7-4995-a683-704f5a852afd']","['port-compressor__aMpJ95G', 'port-compressor__c2KkpJa', 'port-compressor__dQ9sEtn', 'port-compressor__4Lq66pa']",0,"[3605.937222, 3605.03076, 3606.570665, 3634.024205]","[76.773413, 41.277948, 137.202251, 103.858005]",0.0,False,[] +gpt-5,prove-plus-comm,7,"['c21fcb54-3feb-4fc9-8a2e-f7124ea72623', 'f04ee6a2-e734-45ea-aee0-a12fc823ddc1', '96a8d27a-2b18-4290-b066-e003696f4a34', 'f83aa081-4b9c-47a3-98c4-3a51c2e0ab1c', '5636de4e-337b-4383-90a8-5505af001b2c', '5981f001-af9c-46a4-8613-e7d2b3e83a83', 'b70adf84-8259-45e2-ba79-8ad4dcd87df3']","['prove-plus-comm__6XzumWd', 'prove-plus-comm__9tterfk', 'prove-plus-comm__kiTg4Lz', 'prove-plus-comm__PSkGkkz', 'prove-plus-comm__ctgZWaB', 'prove-plus-comm__78vnLZk', 'prove-plus-comm__iRLXcHE']",6,"[370.875792, 102.975392, 219.044767, 205.355998, 284.737252, 360.230246, 200.330913]","[21.566888, 10.336685, 133.977628, 27.667583, 25.999628, 140.710861, 
11.995178]",0.8571428571428571,True,"['c21fcb54-3feb-4fc9-8a2e-f7124ea72623', 'f04ee6a2-e734-45ea-aee0-a12fc823ddc1', '96a8d27a-2b18-4290-b066-e003696f4a34', 'f83aa081-4b9c-47a3-98c4-3a51c2e0ab1c', '5636de4e-337b-4383-90a8-5505af001b2c', 'b70adf84-8259-45e2-ba79-8ad4dcd87df3']" +gpt-5,pypi-server,6,"['149466b5-6db1-4d8b-8283-657408679c3a', '15a108ca-8a0f-4768-925a-797299944f3a', '9f8db136-602e-4c03-9175-61a967263e50', '0af79210-dbc6-4ee7-a82a-a5dcea7a7c45', 'a65031e2-fd31-498a-ad92-9fb2a73ed322', 'af14996c-dcc9-48b5-ada1-a19346018add']","['pypi-server__jfrhbGV', 'pypi-server__ST6jkUQ', 'pypi-server__T3fcjm4', 'pypi-server__iq7QW8g', 'pypi-server__QFgCsGy', 'pypi-server__bK8hDWW']",2,"[163.696097, 358.672772, 182.954646, 183.053019, 280.939756, 209.830223]","[11.792846, 101.420854, 154.567642, 20.67982, 70.044467, 41.85312]",0.3333333333333333,False,"['149466b5-6db1-4d8b-8283-657408679c3a', '9f8db136-602e-4c03-9175-61a967263e50']" +gpt-5,pytorch-model-cli,6,"['2ef87912-4090-4887-afdb-34d376586e6c', '29814007-ef14-4d68-a6ca-6420a13b67c0', '43f4609c-8611-4ded-8bfd-a0f568591a75', '7c66249f-7d19-4818-99bc-6b18ffbbf48b', '2229f55e-8f95-418b-bd52-cc330212ddc3', '1aad6804-be75-4542-9fbc-79d5a89b6ab3']","['pytorch-model-cli__wB7kDRc', 'pytorch-model-cli__xckKGHC', 'pytorch-model-cli__T6yPfWQ', 'pytorch-model-cli__HX3GZVc', 'pytorch-model-cli__JyducYz', 'pytorch-model-cli__HLjJN5o']",0,"[268.154951, 149.855489, 515.502561, 380.339611, 900.00065, 266.112916]","[82.228005, 101.898808, 105.250219, 15.404484, 95.744451, 8.804634]",0.0,False,[] +gpt-5,pytorch-model-recovery,7,"['dda6bfb4-6e0e-487c-b3f8-cb59e9f0fbf6', 'ef12d1b0-3bae-4248-8b0e-3e405a79d1f1', 'f8b929db-54db-4269-9509-fc13931d24de', '6d86d0f1-1bd9-41f4-85e7-8bb7cc70fb53', 'c21d2c6a-a75b-4af2-9ef7-62d545054e62', '1e29b6ac-8a25-440a-9514-d027b295442b', '0bdb0a70-c7f4-4cde-b07c-2daea4655a40']","['pytorch-model-recovery__qpnJnTV', 'pytorch-model-recovery__P8kXNQK', 'pytorch-model-recovery__zqp6Wyy', 
'pytorch-model-recovery__KkUtXxD', 'pytorch-model-recovery__GdBH3Tj', 'pytorch-model-recovery__cXQcUoq', 'pytorch-model-recovery__LXzE4bb']",3,"[900.001126, 901.025254, 910.361005, 370.610594, 263.355408, 900.003088, 904.457709]","[9.010043, 24.747275, 51.50629, 40.441677, 9.561439, 76.25244, 42.683755]",0.42857142857142855,False,"['6d86d0f1-1bd9-41f4-85e7-8bb7cc70fb53', 'c21d2c6a-a75b-4af2-9ef7-62d545054e62', '0bdb0a70-c7f4-4cde-b07c-2daea4655a40']" +gpt-5,qemu-alpine-ssh,6,"['af4bc0ae-2786-4af7-8c9c-6d8b1cd1c03f', '1059aecd-1da1-4806-939d-0f77a64f4e01', '1ed5ee2b-0ca3-4927-9e1c-ff1359ba684c', '199dea09-10b2-4261-9fd7-ae045ebd6b73', '1028cb15-47a2-47ea-9725-da877b19afdc', '44a66d1e-0f6f-447f-a588-2a6cbf046105']","['qemu-alpine-ssh__nfWh82m', 'qemu-alpine-ssh__34UFsVG', 'qemu-alpine-ssh__AZc9kBi', 'qemu-alpine-ssh__ezUVaKv', 'qemu-alpine-ssh__xquageC', 'qemu-alpine-ssh__haYi66i']",1,"[960.243697, 290.37141, 420.593761, 461.559064, 797.312994, 999.167004]","[23.069769, 9.911209, 2.10222, 10.88806, 31.134402, 13.170666]",0.16666666666666666,False,['1059aecd-1da1-4806-939d-0f77a64f4e01'] +gpt-5,qemu-startup,5,"['3da85369-7bca-4ffb-a41a-52b6834ad301', '4c299126-2de4-4b35-9483-008d62c86533', '67b351a2-e03e-4e78-afc5-d5467aaf9250', '446ab231-38c5-474f-b4d7-c15d25f82b6b', 'f10129e8-e9fc-4795-b8ba-f76f796b9c36']","['qemu-startup__xcJDCCZ', 'qemu-startup__z24fHUz', 'qemu-startup__7tnMCzU', 'qemu-startup__hU5Zhy7', 'qemu-startup__9eBTdy9']",4,"[905.013883, 920.1992, 228.781141, 553.60153, 193.458991]","[3.17093, 36.433332, 30.519019, 9.999872, 13.724532]",0.8,True,"['3da85369-7bca-4ffb-a41a-52b6834ad301', '67b351a2-e03e-4e78-afc5-d5467aaf9250', '446ab231-38c5-474f-b4d7-c15d25f82b6b', 'f10129e8-e9fc-4795-b8ba-f76f796b9c36']" +gpt-5,regex-log,5,"['99dc6c5d-2b02-4770-a04b-0b69eda27240', '7beb5a4b-0a7e-4103-a813-40514f0b6da6', '59c3d6eb-b706-4584-9e60-089c5be59b82', 'd4bd0d04-9a65-4d12-bbc1-3a5d52b9f3f5', '654b66e5-8da8-45d6-ae8c-2861742a24cb']","['regex-log__vtucatb', 
'regex-log__ok5iXqt', 'regex-log__F8KA8N7', 'regex-log__hbJQ7eo', 'regex-log__u5GrVZn']",5,"[186.682062, 238.699203, 168.70928, 217.944763, 247.217786]","[157.086014, 180.975655, 225.123094, 19.329018, 33.937092]",1.0,True,"['99dc6c5d-2b02-4770-a04b-0b69eda27240', '7beb5a4b-0a7e-4103-a813-40514f0b6da6', '59c3d6eb-b706-4584-9e60-089c5be59b82', 'd4bd0d04-9a65-4d12-bbc1-3a5d52b9f3f5', '654b66e5-8da8-45d6-ae8c-2861742a24cb']" +gpt-5,reshard-c4-data,6,"['f6a957e6-f4fb-402c-b3eb-fd046460d669', '6c9765f8-dac9-4171-8457-118327cc7f2a', '30451bf1-2fdc-42ae-8c04-d97cabf911d8', 'c72da553-cf68-482d-aa1b-28d792bfb6cc', '1316c1bc-bc3e-431f-b5a6-de43f86d1331', 'c1cd8367-2569-4465-955f-ee41cd766df5']","['reshard-c4-data__oj9LAw2', 'reshard-c4-data__tFHkjjh', 'reshard-c4-data__3uu8HhJ', 'reshard-c4-data__KftxJzX', 'reshard-c4-data__EwtVpW2', 'reshard-c4-data__AxmfnEj']",2,"[900.001721, 573.289721, 388.870852, 900.050693, 626.964926, 478.618469]","[9.273085, 54.610207, 99.952325, 14.728554, 129.535994, 46.36423]",0.3333333333333333,False,"['f6a957e6-f4fb-402c-b3eb-fd046460d669', '30451bf1-2fdc-42ae-8c04-d97cabf911d8']" +gpt-5,reverse-engineering,6,"['8d7e07a1-69e4-4677-9beb-78756f10a8cf', '23db9073-d24e-49a2-8daa-1675270722e1', '1167ddfe-39da-4ce6-b207-748adeb1f74d', '0312a306-010b-4f77-8283-e0ab629e35fc', '7c66b406-eadb-4ca1-b515-3e08e6ce862e', '9fe16851-4f7d-4908-9cf1-e3b9849a37ed']","['reverse-engineering__vQbhzP5', 'reverse-engineering__9Hcj9Za', 'reverse-engineering__M3xfGNg', 'reverse-engineering__dThUe4R', 'reverse-engineering__3uPALAW', 'reverse-engineering__6zZLsHB']",4,"[1824.395143, 921.824824, 1800.070388, 1139.728573, 606.120466, 585.201575]","[17.587637, 78.139616, 19.319989, 73.235257, 8.404357, 26.538598]",0.6666666666666666,True,"['23db9073-d24e-49a2-8daa-1675270722e1', '0312a306-010b-4f77-8283-e0ab629e35fc', '7c66b406-eadb-4ca1-b515-3e08e6ce862e', '9fe16851-4f7d-4908-9cf1-e3b9849a37ed']" +gpt-5,run-pdp11-code,5,"['1919cf9a-1fd6-4bde-aaae-caaa9e851c49', 
'd7a5d5ca-e2bb-4d0b-9cd1-0e8fb4b699f0', 'e31f7c5b-fcf2-4b90-925a-60b2ddce2a18', '7d5a1b21-6d5a-493d-96f8-97570ba74cc2', 'dde43d64-6bfe-40c1-89fc-37ec7520a2bb']","['run-pdp11-code__6R2MA8d', 'run-pdp11-code__BkAWfPM', 'run-pdp11-code__nq4Noz8', 'run-pdp11-code__Lp2neVb', 'run-pdp11-code__dRMAoQQ']",0,"[1007.683648, 914.572972, 534.175527, 1003.639201, 1013.657169]","[74.942647, 105.600511, 29.78986, 71.898024, 202.5436]",0.0,False,[] +gpt-5,sanitize-git-repo,7,"['f69277b5-c127-47d3-8c69-678d7011c3b3', '241c821d-3cf7-4a42-96cd-b552663cf3a6', 'f242a9ae-cc73-4911-8070-8cf8c815d9eb', 'cc582766-9a2c-46ed-b83a-d74c60fa5658', 'b861f4d6-3b62-4352-b87f-7b95eb997c42', '313343a4-9165-4387-9b77-41bd26100869', 'a6bae596-4bf1-4f90-9237-c5b4c5773712']","['sanitize-git-repo__jj8B6xA', 'sanitize-git-repo__s2AdyCK', 'sanitize-git-repo__Z3JibUD', 'sanitize-git-repo__7Y44Qhc', 'sanitize-git-repo__voUesVs', 'sanitize-git-repo__rdf7Pjx', 'sanitize-git-repo__uuksR6G']",2,"[687.354037, 551.618061, 1323.975506, 900.094246, 812.035069, 350.852476, 916.477618]","[66.182756, 7.659214, 225.744919, 64.470737, 78.622541, 10.173409, 21.806599]",0.2857142857142857,False,"['f69277b5-c127-47d3-8c69-678d7011c3b3', '313343a4-9165-4387-9b77-41bd26100869']" +gpt-5,schemelike-metacircular-eval,6,"['51b5bd62-b69d-466b-af88-516dc805c0e0', 'a771d2b7-bd6c-4254-a1ea-cad7f7725e5e', '1ae3b58f-28ca-412b-962d-2e29e0651b17', '5d466124-a81f-41bd-a4c3-9fa7cd305594', 'f3209a38-095f-4b2a-af15-d86fc4264d5f', 'b8ab6e99-fd03-4610-8677-8b6d0db9e00f']","['schemelike-metacircular-eval__G9k36o6', 'schemelike-metacircular-eval__F6XUyRg', 'schemelike-metacircular-eval__EdumHaW', 'schemelike-metacircular-eval__HdEfxVp', 'schemelike-metacircular-eval__qedQuXW', 'schemelike-metacircular-eval__DmFBCry']",0,"[2401.158472, 2400.99404, 2411.939929, 2402.016763, 2400.007932, 2400.010103]","[197.361385, 121.252109, 46.014211, 160.584081, 9.181892, 111.261594]",0.0,False,[] 
+gpt-5,sparql-university,5,"['a1cbb638-d051-4b6e-b15e-b1bad9716260', 'afdfcef2-8fee-4281-b3b3-a837923aa32b', '32b4a7a5-40d5-4c67-9798-40d5dd4ff4e3', '32a49cbc-4893-42fa-9cb4-e728667d393c', 'fe3f0b9d-b340-4b27-bf69-892b528bab55']","['sparql-university__4ma2WRW', 'sparql-university__xZEGfVQ', 'sparql-university__A8pAXMk', 'sparql-university__PcgqxBT', 'sparql-university__bRn826N']",4,"[223.38647, 354.514843, 341.788481, 332.210858, 598.274627]","[119.617046, 59.310407, 61.989563, 55.462359, 231.678874]",0.8,True,"['a1cbb638-d051-4b6e-b15e-b1bad9716260', 'afdfcef2-8fee-4281-b3b3-a837923aa32b', '32a49cbc-4893-42fa-9cb4-e728667d393c', 'fe3f0b9d-b340-4b27-bf69-892b528bab55']" +gpt-5,sqlite-db-truncate,7,"['4aa13201-97bd-4e63-8fa8-e76e4fc039c4', '2d23f238-75a0-4324-a18b-2f4a99a3918d', 'a3a0c9e8-d57a-4abd-96a8-fb603013966b', '162b9cfd-00af-4ddd-9470-5bb9f62cc793', 'ced8e5ff-93dc-482e-91fd-7fefe669c916', 'ac945708-daec-418a-9965-578dc75284bb', 'd3ee9792-1560-48e6-a69e-14b393301e50']","['sqlite-db-truncate__G3MMdK5', 'sqlite-db-truncate__mMDxdsc', 'sqlite-db-truncate__eKCio8c', 'sqlite-db-truncate__Dzg2xrY', 'sqlite-db-truncate__rkf3TXD', 'sqlite-db-truncate__Q5Ca3G3', 'sqlite-db-truncate__P7YgUY5']",0,"[533.71273, 859.7268, 345.961631, 121.735473, 426.899398, 622.8403, 902.54355]","[48.426867, 28.123772, 11.865572, 9.11589, 46.654469, 120.96924, 20.508237]",0.0,False,[] +gpt-5,sqlite-with-gcov,6,"['ddc92b38-9466-41a5-99ec-e31a709ba96e', '35f8f37c-134f-4995-9f11-d440e6a8de25', '52b8dfa7-4997-40ee-b92b-18d6dea22fdc', '622fd5f6-741a-44db-9935-6008fcd31d34', 'fdc82994-15a6-4eaa-840b-abe86cce435e', '9ceda5c9-8776-40d5-8044-68e252904863']","['sqlite-with-gcov__6pxrpGS', 'sqlite-with-gcov__GPR7z5w', 'sqlite-with-gcov__eywFLF2', 'sqlite-with-gcov__TH67UPA', 'sqlite-with-gcov__bTmqs3S', 'sqlite-with-gcov__znHuFmi']",2,"[436.212848, 402.98383, 334.186121, 325.941034, 553.358463, 660.777727]","[105.029621, 58.344799, 36.174083, 16.037565, 46.252575, 
25.617673]",0.3333333333333333,False,"['52b8dfa7-4997-40ee-b92b-18d6dea22fdc', '9ceda5c9-8776-40d5-8044-68e252904863']" +gpt-5,torch-tensor-parallelism,6,"['4ab88066-e885-44a2-9c24-94c635a3f7f6', '3dc6ee1d-c738-42df-9d4f-f9ab5105377d', '7f3496a1-13ee-415c-8157-2359add0aa30', '28a0e44b-064b-4fb5-a137-3d2f86c548f6', 'ffb28932-018e-4caa-bd35-c5cf59a53122', 'a6adc374-afbf-4a74-8100-eb78326711ea']","['torch-tensor-parallelism__jSzZ8Ut', 'torch-tensor-parallelism__ViQ8kRu', 'torch-tensor-parallelism__qpxdnBK', 'torch-tensor-parallelism__HGMvCrP', 'torch-tensor-parallelism__DnzfdRR', 'torch-tensor-parallelism__WLGtUa7']",0,"[204.641127, 255.797965, 366.392131, 513.068155, 168.983089, 234.572263]","[138.893892, 47.262796, 37.35833, 82.77083, 17.244252, 56.132675]",0.0,False,[] +gpt-5,train-fasttext,5,"['db727f81-ca38-4bf5-8464-a9f1b7d3f610', 'c26f7a7b-2f4b-4ff1-8232-7e44d8fb28bb', 'b633aacc-dcff-4f8e-a650-7d1d0f72092d', 'ab15ff57-828d-4ab1-8752-34bd1c0d9c90', '2bb45cc0-f0fc-4aba-bd12-b45ca6148f38']","['train-fasttext__oW4w67M', 'train-fasttext__ZNMv2uB', 'train-fasttext__eKJd8TB', 'train-fasttext__hKnhFu2', 'train-fasttext__7UAGjYp']",0,"[3624.595999, 3648.158015, 3621.195862, 3600.5908, 3615.256775]","[32.828283, 23.456096, 28.549253, 21.054708, 37.265477]",0.0,False,[] +gpt-5,tune-mjcf,7,"['01b5556e-d6be-49cd-85bf-30724e006683', 'fd315990-06cb-451a-972d-527e2b67435f', '8cf0bd23-e9e7-44d6-b41c-a5071722d981', '9239f3c7-d6d0-48ce-9b2c-07953a509501', '3c39cdce-39e3-491c-9c4a-e35bb122b626', '5bc41dd8-6f5b-4e9d-abb2-eed152f2acb2', 'ded69ace-95cd-43ca-ab69-53632c0b4ab4']","['tune-mjcf__fzmEwFj', 'tune-mjcf__R4t4guy', 'tune-mjcf__MsQkxJT', 'tune-mjcf__omFZfMs', 'tune-mjcf__UoBGPSD', 'tune-mjcf__UU33duQ', 'tune-mjcf__XGLa6Sy']",0,"[903.789968, 932.103897, 900.711382, 900.000325, 905.418281, 963.670652, 900.001077]","[24.775222, 19.086173, 8.309458, 11.294213, 26.155657, 33.055301, 21.898039]",0.0,False,[] +gpt-5,video-processing,5,"['c12acb24-1dfa-477c-9249-3fcfa4dafa15', 
'3d59670f-f03c-4de4-abb8-845522599496', '7e1f9aec-c1a5-4c77-9489-88a90ca767ad', '04bfb531-0353-4cb7-af04-2f13eed81753', '3c13f6df-2120-45c9-aeb7-18f6f2824af7']","['video-processing__QW6Uo2R', 'video-processing__igG7gJP', 'video-processing__M9d9435', 'video-processing__iTxVR6T', 'video-processing__WLK8Kpu']",0,"[248.232755, 278.140621, 211.50711, 326.26183, 219.297213]","[107.85115, 34.391403, 37.86666, 53.065259, 39.941648]",0.0,False,[] +gpt-5,vulnerable-secret,7,"['2eebefca-c851-487b-a2dd-c01eb85cafe2', 'a77a7663-92ac-4404-8432-dfae4a94f971', '48a3250a-06f8-40df-9618-990fccea3ef8', 'ffb59b60-5052-4275-b34a-1fa69d9475fe', '6ade59a9-97ae-41e5-ab64-d68f42099dbc', '760efc82-9101-4a26-9df3-e87cc0103cb3', '63269270-3db3-4fe4-9521-114dc49ad787']","['vulnerable-secret__qL9omFF', 'vulnerable-secret__9SpjGU6', 'vulnerable-secret__Gy72yYt', 'vulnerable-secret__FZETqFY', 'vulnerable-secret__yn9fjLW', 'vulnerable-secret__JRqMjcu', 'vulnerable-secret__BRRPDUW']",2,"[485.781482, 923.786604, 920.045444, 901.358977, 900.001249, 417.905626, 977.156881]","[10.939889, 92.011013, 12.741224, 7.486536, 10.165231, 23.263853, 38.344186]",0.2857142857142857,False,"['2eebefca-c851-487b-a2dd-c01eb85cafe2', '760efc82-9101-4a26-9df3-e87cc0103cb3']" +gpt-5,wasm-pipeline,6,"['e9da34a1-f7d9-4227-815d-fe46b4e225f2', '8bbabfb2-264b-4fae-9d0e-133db184896b', 'df04802d-c892-4a9c-bceb-4987130145fd', '665c7647-871f-4cdd-bcca-aeb4f9814ca5', '79be448e-3684-4991-be44-cc2de2616429', 'e88c80e3-b8ad-4aba-9fc3-4377e6e1638b']","['wasm-pipeline__8fNe4gc', 'wasm-pipeline__QveJ2tP', 'wasm-pipeline__zUHoh4D', 'wasm-pipeline__G4AsmJt', 'wasm-pipeline__8jnq3z9', 'wasm-pipeline__DxMCumo']",6,"[797.098302, 171.387898, 697.914905, 334.868496, 408.366168, 669.227777]","[7.955167, 2.03718, 21.043617, 5.344225, 4.335014, 13.741119]",1.0,True,"['e9da34a1-f7d9-4227-815d-fe46b4e225f2', '8bbabfb2-264b-4fae-9d0e-133db184896b', 'df04802d-c892-4a9c-bceb-4987130145fd', '665c7647-871f-4cdd-bcca-aeb4f9814ca5', 
'79be448e-3684-4991-be44-cc2de2616429', 'e88c80e3-b8ad-4aba-9fc3-4377e6e1638b']" +gpt-5,winning-avg-corewars,7,"['89694e03-4fb7-4755-a838-09aa918f8bbe', '8f35d819-3c21-453e-b571-88d244f16692', '9df4c247-fed5-4d32-b2c2-9e6bdc72a573', '131933a1-ceb2-4f41-a125-aa0ad45bf861', '87b821c8-0f87-4f4c-a923-60bfb7660416', '412f034e-057f-4601-a199-8905f6db9312', '6a0c7800-5ac9-4494-b557-27455630fba1']","['winning-avg-corewars__kXGiAx9', 'winning-avg-corewars__ozJ4dZN', 'winning-avg-corewars__FcUASZS', 'winning-avg-corewars__SUuPDtT', 'winning-avg-corewars__RBxmVCQ', 'winning-avg-corewars__NcSDz9A', 'winning-avg-corewars__ZN5WWjh']",2,"[3603.644069, 3621.26844, 974.993514, 2896.633235, 3600.55112, 3608.612061, 1408.781807]","[29.23166, 4.832629, 2.189361, 83.328998, 16.060615, 9.115705, 3.151715]",0.2857142857142857,False,"['9df4c247-fed5-4d32-b2c2-9e6bdc72a573', '131933a1-ceb2-4f41-a125-aa0ad45bf861']" +gpt-5,write-compressor,6,"['412632cc-aac1-47d1-85bd-1afd32e384f6', 'f5ea7123-b733-4901-94b6-d72e3799f09c', 'b8413636-42b0-4b7e-9f02-006bf9813646', 'fc1eccda-d40b-4ece-b7ea-dcd03d3bbeed', '201e3378-70f0-4bef-b329-73601ef2bc7d', '62a09aec-f472-43a2-81ae-a6162b9a55de']","['write-compressor__A5EXbUB', 'write-compressor__mByiNh4', 'write-compressor__iCK3shA', 'write-compressor__JdSR82L', 'write-compressor__gXSuwMx', 'write-compressor__8hFY74L']",2,"[900.250943, 707.465168, 817.941795, 893.131821, 906.284959, 900.527563]","[55.188902, 37.50494, 16.752299, 141.710948, 82.122405, 45.038597]",0.3333333333333333,False,"['f5ea7123-b733-4901-94b6-d72e3799f09c', 'b8413636-42b0-4b7e-9f02-006bf9813646']" +gpt-5-mini,adaptive-rejection-sampler,5,"['5ac7e773-e660-424d-815e-dcdede114691', 'a34b2203-8a62-47ca-8d25-28da78aed828', '3b43e2b5-a1b0-4bce-b825-c1bd26347e87', 'ecbbd069-5400-4116-b9ac-54260cc9fcd3', 'ee3043c4-c0a3-497b-b665-6e7658461dc8']","['adaptive-rejection-sampler__VkwBnQr', 'adaptive-rejection-sampler__9RXqb6a', 'adaptive-rejection-sampler__WiYDQhM', 
'adaptive-rejection-sampler__Qxe4TEJ', 'adaptive-rejection-sampler__82TPzeC']",2,"[946.678663, 900.006354, 772.160986, 676.379444, 900.037299]","[64.366436, 74.806225, 231.964638, 28.097344, 99.085099]",0.4,False,"['a34b2203-8a62-47ca-8d25-28da78aed828', 'ecbbd069-5400-4116-b9ac-54260cc9fcd3']" +gpt-5-mini,bn-fit-modify,5,"['cbabe714-548d-4301-9c53-92d701deb332', 'a5a65fa5-09d4-4e7d-8b68-f04aeec0e0e1', '086eee7f-9cf0-4ed2-a5ff-7e543c73a31f', 'a4907b05-ef73-49ab-9f37-4937ad5de09c', '7c502efa-440c-4d72-8ee6-ccc591cc85f8']","['bn-fit-modify__RvSGSEU', 'bn-fit-modify__cfnectH', 'bn-fit-modify__69F929H', 'bn-fit-modify__vebVH3t', 'bn-fit-modify__Uj2LcBy']",3,"[234.143162, 516.950439, 596.082064, 458.541134, 922.214965]","[45.785209, 275.67976, 67.900913, 22.130757, 197.679985]",0.6,True,"['086eee7f-9cf0-4ed2-a5ff-7e543c73a31f', 'a4907b05-ef73-49ab-9f37-4937ad5de09c', '7c502efa-440c-4d72-8ee6-ccc591cc85f8']" +gpt-5-mini,break-filter-js-from-html,5,"['d3f18a4f-3473-4420-bd11-a8a99402db36', '19665476-e62b-4db5-bd6d-af1f54c2e1be', 'bc78da9d-0314-4fb1-820c-81b24a09f2ac', 'b1b73a7c-6385-4a4c-89bd-70fdba0eda5f', 'eb1600dc-eb83-4359-b7c3-4838da522f94']","['break-filter-js-from-html__swgzvFN', 'break-filter-js-from-html__EdsaXuz', 'break-filter-js-from-html__cYBmvKG', 'break-filter-js-from-html__nLweD3H', 'break-filter-js-from-html__FKLysvH']",0,"[348.146137, 318.149611, 170.990975, 334.171093, 175.414401]","[11.367755, 55.741444, 78.959214, 29.626709, 13.514899]",0.0,False,[] +gpt-5-mini,build-cython-ext,5,"['b3e08346-d525-426c-b963-e1bf69c9a8f3', '50cb1a63-0aa0-4785-ae16-d365d5db67e6', 'd9dafa1c-e162-4448-a732-d1ef9696edf0', 'af44d6e2-e890-4da5-bd1c-87b6f74aab9f', '33ead04b-d8d3-4b54-b232-4bc9421e7a8f']","['build-cython-ext__cmFfA99', 'build-cython-ext__t6xP3DT', 'build-cython-ext__BEH8RNj', 'build-cython-ext__bDi7SCF', 'build-cython-ext__Wuixe83']",1,"[910.923358, 940.840837, 900.469947, 904.489212, 901.121688]","[13.3387, 102.170203, 17.466234, 43.481336, 
151.472632]",0.2,False,['33ead04b-d8d3-4b54-b232-4bc9421e7a8f'] +gpt-5-mini,build-initramfs-qemu,2,"['b9c5b36a-db33-4a34-ae6e-09ec5e5939cd', '61985c81-214f-4a68-a27b-4a43a3fbb78e']","['build-initramfs-qemu__EjTyXem', 'build-initramfs-qemu__qVDskFY']",0,"[900.568735, 135.585142]","[207.543578, 10.519464]",0.0,False,[] +gpt-5-mini,build-pmars,5,"['967648d1-efad-453d-80f4-7bc2233b80ec', 'eb508604-8ad6-438c-98fc-e5fcbb9f99c5', 'daf4b291-5ba1-4ed3-9636-cb7dccfda898', '092dccba-32eb-491d-b1df-db315b885144', 'b1dc7dfa-386d-41eb-b055-63d6479b5d81']","['build-pmars__4wLCKKG', 'build-pmars__ucDXahf', 'build-pmars__LrgEwNT', 'build-pmars__2DcbA3J', 'build-pmars__6APrjfR']",1,"[903.912323, 604.95726, 2063.485858, 921.000067, 948.159392]","[41.156816, 6.240819, 4.518885, 59.955662, 4.008926]",0.2,False,['eb508604-8ad6-438c-98fc-e5fcbb9f99c5'] +gpt-5-mini,build-pov-ray,5,"['b16129eb-7d7d-4b46-85d6-3d63ee08bfe7', '2571de58-8684-42ef-a825-4b8ee35fe5d5', '3fb7cd02-0166-4f4a-bd68-e2fbf9807944', '66844dda-35e6-4e87-9251-260e0f8f9339', '7ff09eb3-af62-464f-971c-3fe7b1d141f4']","['build-pov-ray__cva4cgo', 'build-pov-ray__fV6rbYF', 'build-pov-ray__F8d8qP9', 'build-pov-ray__VWBmDmL', 'build-pov-ray__Mf5xtPP']",0,"[6005.852133, 1755.048156, 6000.014509, 960.79387, 870.001616]","[119.02043, 100.239486, 32.149612, 68.545826, 28.103519]",0.0,False,[] +gpt-5-mini,cancel-async-tasks,5,"['e9c21109-98b5-4153-a6a0-5ba4b01ef7fa', 'e1a72fef-b8cd-46bb-8aa3-f504a431046c', '71fef181-990a-4f97-94b4-1c39ea66e95c', '207b34fd-80d1-41f7-8624-6ef0b7f0dc72', 'dd0fca22-7153-4e63-8d9a-34a2eebe54bb']","['cancel-async-tasks__g8SvaHX', 'cancel-async-tasks__73wekyn', 'cancel-async-tasks__v7KcMHX', 'cancel-async-tasks__szDgJX5', 'cancel-async-tasks__MFpJUeQ']",2,"[88.83292, 119.909751, 119.079362, 439.725406, 80.501672]","[88.789626, 103.864425, 70.971078, 337.354594, 51.046223]",0.4,False,"['71fef181-990a-4f97-94b4-1c39ea66e95c', 'dd0fca22-7153-4e63-8d9a-34a2eebe54bb']" 
+gpt-5-mini,chess-best-move,5,"['19d5dad0-86e9-4835-8099-667c6757bef3', 'f3314122-cf6d-4127-a9c1-88463b8ed8dd', 'b59f150b-8b59-4d24-98f5-6d999fb75cab', 'c27b65a0-4c91-4f6f-b501-82382ebc4d8d', '79d64d86-3e7c-4aa5-a892-32a78b9328f2']","['chess-best-move__YHm96Qt', 'chess-best-move__psxTY8i', 'chess-best-move__JncetSn', 'chess-best-move__z5Ynggj', 'chess-best-move__fFoSxF7']",0,"[805.153257, 906.753355, 904.543426, 652.434609, 902.766475]","[7.83687, 243.427872, 41.020731, 155.016315, 14.362144]",0.0,False,[] +gpt-5-mini,circuit-fibsqrt,5,"['c9c0b55a-49f2-46a4-8b94-ca8679010cac', '6cedb864-dfdd-4b8c-8c2b-f133a68c9811', '78f0df05-f587-4a4d-8de2-56d0da1cf5fe', 'f0407181-42a8-42f4-bc96-450f35a84397', '7a4207b9-7cea-453d-92db-0a29babefa85']","['circuit-fibsqrt__pVtt6Uf', 'circuit-fibsqrt__9yNm5yQ', 'circuit-fibsqrt__gnRLUCg', 'circuit-fibsqrt__JKAHCcm', 'circuit-fibsqrt__efPmDRp']",0,"[3617.064916, 3605.65617, 3605.750887, 468.453283, 109.78106]","[51.948146, 28.543856, 14.308915, 84.71502, 78.071712]",0.0,False,[] +gpt-5-mini,cobol-modernization,5,"['d7af17dd-2c83-4d4e-9f5d-db12d7fe76db', '77d98bf1-2fd1-4540-9bd6-80e189de6cee', '4bef9563-e93d-4b88-bf3d-bfacb401ef98', 'e65cb80e-d306-4c06-bd34-3cebb703917a', '48f6b31b-e463-4816-8d8e-1aa58eb9cc92']","['cobol-modernization__eM4HK5K', 'cobol-modernization__pKtauiX', 'cobol-modernization__F3e9uAL', 'cobol-modernization__3WSYnnE', 'cobol-modernization__8e5BtKU']",5,"[348.578684, 665.606813, 324.869764, 494.87513, 262.038942]","[47.552834, 165.555758, 52.810239, 46.037647, 49.000811]",1.0,True,"['d7af17dd-2c83-4d4e-9f5d-db12d7fe76db', '77d98bf1-2fd1-4540-9bd6-80e189de6cee', '4bef9563-e93d-4b88-bf3d-bfacb401ef98', 'e65cb80e-d306-4c06-bd34-3cebb703917a', '48f6b31b-e463-4816-8d8e-1aa58eb9cc92']" +gpt-5-mini,code-from-image,5,"['4df69ee3-8d7e-4019-a33b-eb894ad68f4e', '28693443-691e-4ad7-b412-d92790eb616a', '34746c8c-c141-4dc3-bc2a-a2a1153fcf22', 'cd6f129c-7664-4a93-9856-b4e79ca1e6e8', 
'3b6709e6-cfa4-4551-b376-fb7c2966129b']","['code-from-image__fCHjUXy', 'code-from-image__RGJoJbF', 'code-from-image__rQEaJ9z', 'code-from-image__HFvcH9m', 'code-from-image__rocQnDL']",0,"[1200.219384, 1219.535198, 1201.814291, 1217.799886, 1200.001952]","[32.763359, 25.009147, 37.140605, 217.323123, 79.5932]",0.0,False,[] +gpt-5-mini,configure-git-webserver,5,"['022e116a-8e48-46f4-8851-16d0f4ecfd30', 'bb27bd2e-4406-481f-8aa2-506ea6a4bf36', 'd1f205aa-ab0a-4f98-b5bd-b01f51f6129b', 'cae30b61-6509-4c48-9a9b-1ca2a188926a', 'd1669f60-bd1a-4b26-95b0-3ee7629fb867']","['configure-git-webserver__rogQxhp', 'configure-git-webserver__nE5ktWq', 'configure-git-webserver__38KKZtc', 'configure-git-webserver__7BkBDtp', 'configure-git-webserver__bWMMcap']",3,"[134.555983, 460.030772, 270.607702, 296.458239, 388.061256]","[70.827498, 38.593757, 257.74099, 33.657244, 34.248438]",0.6,True,"['022e116a-8e48-46f4-8851-16d0f4ecfd30', 'cae30b61-6509-4c48-9a9b-1ca2a188926a', 'd1669f60-bd1a-4b26-95b0-3ee7629fb867']" +gpt-5-mini,constraints-scheduling,5,"['81cd5f3d-2d04-4e32-8725-d673b504d24c', '649303d3-19fd-4c73-8be9-9b7b59c5856c', '05238921-61a2-4282-abb4-9204bb623204', 'dd71d284-491a-4ff9-999a-3c5b4d5b02b1', '1e9984ca-4e75-408f-b262-ecf4800fe727']","['constraints-scheduling__RVUAYjr', 'constraints-scheduling__z9dwTJT', 'constraints-scheduling__Dfw5St5', 'constraints-scheduling__Xjzm8tu', 'constraints-scheduling__sYfk59x']",4,"[125.094261, 279.480295, 257.038028, 276.107046, 461.605981]","[13.952334, 108.21555, 73.512551, 57.789326, 219.259087]",0.8,True,"['81cd5f3d-2d04-4e32-8725-d673b504d24c', '649303d3-19fd-4c73-8be9-9b7b59c5856c', 'dd71d284-491a-4ff9-999a-3c5b4d5b02b1', '1e9984ca-4e75-408f-b262-ecf4800fe727']" +gpt-5-mini,count-dataset-tokens,5,"['4801255f-93bb-4a2d-bd2c-d38c10b9a2e6', '43511834-5e9a-4084-afc8-cd5d47201c33', '19859aa6-f1cc-4e75-a2a6-5db0156a6d06', '230ef66e-5a8b-4b46-8ddc-727491b5b964', '462f180b-28ea-4829-9bdf-cd1d1408c285']","['count-dataset-tokens__tsz3LnP', 
'count-dataset-tokens__Gs63JJv', 'count-dataset-tokens__swrytsm', 'count-dataset-tokens__zyfWHAY', 'count-dataset-tokens__4SsuKpc']",0,"[900.058877, 756.869092, 915.990035, 908.704351, 920.029806]","[8.476016, 111.821264, 30.376337, 23.897454, 45.555575]",0.0,False,[] +gpt-5-mini,crack-7z-hash,5,"['ab4fff6e-2999-43c2-9776-726b1efa65c2', '9393fcd9-2ad1-416a-b62c-82009c277103', '9287adce-e437-43a9-a80a-7024048aff5a', '1f358e6d-0c41-4026-b2b9-5facdf6758d5', 'a4418230-04b9-43c8-94f2-5705649cc023']","['crack-7z-hash__qTYb4te', 'crack-7z-hash__vBJY2xx', 'crack-7z-hash__yZJkWAp', 'crack-7z-hash__RnmpKJM', 'crack-7z-hash__EqBKpXF']",0,"[87.18888, 68.630062, 544.50342, 38.473258, 900.025975]","[17.952297, 30.963026, 34.356492, 11.563662, 50.183093]",0.0,False,[] +gpt-5-mini,db-wal-recovery,5,"['be62c2d2-27b9-4312-a6e5-92de5f442a40', '406de4ef-6bb1-4608-97d9-10fc1834b3e0', 'b46001ea-ae53-41e0-a41a-0a0f78529981', '0d0edd5d-051e-4539-9cc1-416a7ff82abb', '5e963ba5-83a1-419e-b28a-a37e71fe6c3d']","['db-wal-recovery__uSjx6eq', 'db-wal-recovery__i63s6bC', 'db-wal-recovery__3Sk6e7c', 'db-wal-recovery__LJVJXpi', 'db-wal-recovery__7cRyRPG']",0,"[901.020909, 343.972251, 171.910375, 488.102633, 971.119018]","[7.575081, 51.591361, 20.350335, 15.730101, 39.055524]",0.0,False,[] +gpt-5-mini,distribution-search,5,"['52a07a4d-fcb0-41b0-8435-cfc29f2a0666', '5e56ea48-a2e9-4ff3-a960-1ad4d38b53b7', '9a5af79d-fb5c-4d63-88cb-a176b53e86b8', '3eaaeeef-de36-4695-960b-3559aa485b32', '640941e1-b733-4c6d-a7b6-0c509318dd4c']","['distribution-search__QVdD4eE', 'distribution-search__RBbNdXx', 'distribution-search__WonhsbK', 'distribution-search__cgitgGQ', 'distribution-search__gVmwTot']",5,"[1429.156094, 2123.276968, 1309.206797, 863.045016, 297.626007]","[22.51652, 160.179931, 50.427502, 31.619609, 156.174052]",1.0,True,"['52a07a4d-fcb0-41b0-8435-cfc29f2a0666', '5e56ea48-a2e9-4ff3-a960-1ad4d38b53b7', '9a5af79d-fb5c-4d63-88cb-a176b53e86b8', '3eaaeeef-de36-4695-960b-3559aa485b32', 
'640941e1-b733-4c6d-a7b6-0c509318dd4c']" +gpt-5-mini,dna-assembly,5,"['fa8b227a-424d-4e14-bcb3-322b741600ad', '86bdef5a-7f00-46fe-a1da-e049def48660', '3c148fd0-5f94-4e67-800d-ca9c66f6f0ed', '87f64194-cdc8-4a5d-a270-d0f7374ccb12', 'be1cdc26-3239-42f8-849b-9c78e47d48a2']","['dna-assembly__48vwkuv', 'dna-assembly__9KRaGVe', 'dna-assembly__VidxRgW', 'dna-assembly__4PFBJjK', 'dna-assembly__Spu7jku']",0,"[720.074785, 230.196528, 720.089836, 737.071645, 753.47746]","[78.555246, 69.923172, 97.842105, 32.992603, 41.149436]",0.0,False,[] +gpt-5-mini,dna-insert,5,"['5ca54a18-7919-4eb2-b504-3aa291b3a3f4', '21e9f546-dc34-449a-8163-6f1fa434b641', '20e3922f-8209-4f2d-bdb4-5d895e088d21', '65618365-9d10-4eb3-b9c1-31053a1273fb', '09d88c43-88e6-4a98-a6e9-c32e2f1add4b']","['dna-insert__EcLMp2E', 'dna-insert__68P9v3D', 'dna-insert__6LansjW', 'dna-insert__LxXi5xA', 'dna-insert__CPyZQSX']",0,"[369.690304, 387.555517, 360.669975, 453.338066, 363.505823]","[34.291053, 41.78666, 63.464327, 51.501523, 20.800538]",0.0,False,[] +gpt-5-mini,extract-elf,5,"['6c916892-6d20-4cd3-b501-7c8f1d1f74aa', 'dbac6eae-042d-4b33-afc6-4247d2710b99', '654f15a3-eb15-4b57-a050-e1d6eef6129e', '595e69cb-bf16-42f2-ba4c-b9a66299fcec', '4a7b5122-cf42-441e-989d-8495d975beab']","['extract-elf__snX6CSc', 'extract-elf__hG4LJE5', 'extract-elf__Dt6Ph8j', 'extract-elf__GFf4bcY', 'extract-elf__BK8yUVf']",3,"[155.241286, 300.908164, 210.088688, 227.823148, 277.409099]","[58.447225, 125.927587, 37.610116, 91.54854, 31.041228]",0.6,True,"['6c916892-6d20-4cd3-b501-7c8f1d1f74aa', 'dbac6eae-042d-4b33-afc6-4247d2710b99', '654f15a3-eb15-4b57-a050-e1d6eef6129e']" +gpt-5-mini,feal-differential-cryptanalysis,5,"['58028152-1114-4c65-9ee9-18a6f8605195', '21116792-02f2-448d-a096-6c493e3dae40', '4819bfcf-4bef-42f7-817b-bc90db91591d', '770daba9-fc1b-472c-ab07-65c8a4ef928a', '5dea9c69-032a-4195-9e6e-a495b9ee114b']","['feal-differential-cryptanalysis__4GNZBYS', 'feal-differential-cryptanalysis__bVmjb3T', 
'feal-differential-cryptanalysis__jg5URBf', 'feal-differential-cryptanalysis__7ExYS3W', 'feal-differential-cryptanalysis__3kQNHq2']",0,"[354.333943, 246.990724, 289.31515, 373.724736, 1079.920374]","[10.836724, 50.642613, 88.966717, 14.241925, 194.176649]",0.0,False,[] +gpt-5-mini,feal-linear-cryptanalysis,5,"['1207a56c-016c-47e9-ab6d-45cf538b7af8', '88ff674f-519b-4fa9-9836-9c8cddedf725', '9d5baf9c-d9af-4c03-b0b8-4346dcfd1977', '3ae5dc49-8577-4768-bebe-d13281a1e833', 'e55ecae2-58f3-4d99-8e65-641725906518']","['feal-linear-cryptanalysis__YNBE8jd', 'feal-linear-cryptanalysis__zmNc4BY', 'feal-linear-cryptanalysis__3RrbUc4', 'feal-linear-cryptanalysis__8Xo7TEM', 'feal-linear-cryptanalysis__6DWPGs6']",0,"[1800.967376, 670.06386, 1800.055538, 1805.88624, 1815.211643]","[20.757714, 80.848167, 12.854684, 57.102209, 60.32363]",0.0,False,[] +gpt-5-mini,filter-js-from-html,5,"['123b234a-2a31-473d-937b-dde198f48837', '5812557d-5e3b-4f9b-9375-105da96b6e64', 'af895e31-122e-4263-bbe1-13d5904723a8', '7bd97228-02ee-4869-96a4-158daa667939', '0235ccea-860e-440c-94b7-8cb224c6a8ac']","['filter-js-from-html__D5Cf43o', 'filter-js-from-html__ZpnnWfa', 'filter-js-from-html__xP6FgpK', 'filter-js-from-html__dKhopcS', 'filter-js-from-html__KbkA3JH']",0,"[567.152518, 231.185136, 126.025126, 286.460354, 217.306991]","[86.324813, 125.407917, 79.510038, 51.383524, 53.179001]",0.0,False,[] +gpt-5-mini,financial-document-processor,5,"['96448c0f-b062-41b5-9de1-1404ad727b96', 'feaf761c-261a-4830-9346-a5382bcfe348', '932c3ea9-fbf9-42dc-8a74-5e3835f88734', 'b841f96f-063c-44c6-a480-10e4f6fadbfb', 'de79d0fe-4ad6-433e-960a-338a817b5739']","['financial-document-processor__VdneXoJ', 'financial-document-processor__VhXj5WB', 'financial-document-processor__5kvVNUN', 'financial-document-processor__cFWTSmT', 'financial-document-processor__bMSS8Ju']",0,"[304.944171, 200.88557, 1200.544146, 187.002199, 484.417215]","[266.306084, 21.838226, 69.878915, 140.542531, 16.014394]",0.0,False,[] 
+gpt-5-mini,fix-code-vulnerability,5,"['6b16f7be-5916-46a1-882b-efe399c166cf', 'b78b8f96-a08c-456e-9b19-413560af85c0', '793f0a0a-4a22-46ce-933f-fa7649fb8af2', '10699f84-e9ae-4c9c-a0b2-34545eacd4ca', '3de59e94-3567-48ee-8d51-13ac73600e40']","['fix-code-vulnerability__qaBr2bm', 'fix-code-vulnerability__gMFsrT9', 'fix-code-vulnerability__sB9UdV5', 'fix-code-vulnerability__YVNLWPN', 'fix-code-vulnerability__jHmhqeQ']",0,"[900.450205, 952.186401, 967.265609, 904.18628, 900.312394]","[4.298248, 11.157668, 67.105305, 72.811727, 79.971299]",0.0,False,[] +gpt-5-mini,fix-git,5,"['1cfce4b8-cfdf-408a-acf7-c3b9497cbb72', '5e5bf6ea-c454-4c8c-b20f-aa5e662b6415', '13f81cda-2878-447b-b986-02fe56452509', '18cefb64-eb87-4470-a1f6-a728fd04db81', '578f6b33-23dd-4fdb-bbcb-a7ae0349bb6d']","['fix-git__ZBVrhWC', 'fix-git__Z47wEUc', 'fix-git__BivJ5wX', 'fix-git__SAaxQ4q', 'fix-git__VwfkxuQ']",3,"[330.479175, 380.362449, 900.95335, 151.432391, 482.476693]","[92.511515, 39.838273, 63.915772, 22.518269, 53.971818]",0.6,True,"['1cfce4b8-cfdf-408a-acf7-c3b9497cbb72', '5e5bf6ea-c454-4c8c-b20f-aa5e662b6415', '578f6b33-23dd-4fdb-bbcb-a7ae0349bb6d']" +gpt-5-mini,fix-ocaml-gc,5,"['74c6cc0c-f59c-436b-adbb-4c1781960e95', '6f4f0cc9-386f-4f13-9c3a-7ff6266dfe75', '3d6d09c9-79e2-443b-81d6-faae4f95ece1', '4b9a2d74-74c1-4921-929d-f390577ac6b4', 'd42cef3c-b8c4-42f2-8918-7f3aa1c6ce9e']","['fix-ocaml-gc__ZKXfVot', 'fix-ocaml-gc__iQ5ym2G', 'fix-ocaml-gc__PvhVxjz', 'fix-ocaml-gc__7xd6W8K', 'fix-ocaml-gc__zRokSLw']",0,"[3602.311654, 3600.000779, 3637.845316, 3605.146151, 3755.150004]","[231.206674, 33.486211, 37.646934, 60.05811, 16.835302]",0.0,False,[] +gpt-5-mini,form-filling,5,"['79944840-cfee-4e24-adb3-640e801c0be5', '4a198c09-9a36-431c-8b87-9bfec3e599a4', '0ed43a97-778c-433d-b238-7855ec636746', '82e5ca76-e88d-4512-ab10-463cd62c7ed4', 'bb4e93a3-bf83-4472-90e6-036592476b29']","['form-filling__XbQBd5z', 'form-filling__aBcU2SQ', 'form-filling__E8qVRHQ', 'form-filling__GPihETB', 
'form-filling__7qfqAgk']",5,"[183.801511, 370.006002, 676.625062, 202.965418, 374.630614]","[42.814643, 5.472927, 63.371772, 19.674814, 9.485481]",1.0,True,"['79944840-cfee-4e24-adb3-640e801c0be5', '4a198c09-9a36-431c-8b87-9bfec3e599a4', '0ed43a97-778c-433d-b238-7855ec636746', '82e5ca76-e88d-4512-ab10-463cd62c7ed4', 'bb4e93a3-bf83-4472-90e6-036592476b29']" +gpt-5-mini,git-leak-recovery,5,"['d84a0485-ebfb-4fc4-ba22-1b893f5e9839', '8ebd1b27-ddc6-4609-9260-53052f563d16', '74885a5e-6fd5-4003-974b-776be6047c09', 'bd0c604e-2fcc-4b5e-bdb6-d66b4f06d8e9', '74c86c47-f47a-495e-b6a3-8eb1cc86fd50']","['git-leak-recovery__qMog5Nu', 'git-leak-recovery__9u67fVf', 'git-leak-recovery__nG6jTvw', 'git-leak-recovery__x2H7y4a', 'git-leak-recovery__DnkZ24k']",0,"[919.619248, 994.094624, 238.546245, 768.21181, 901.421608]","[21.443668, 54.545439, 44.612939, 44.901076, 76.289213]",0.0,False,[] +gpt-5-mini,gpt2-codegolf,5,"['1a70ae1a-a9e7-428c-a762-8ef33b77657b', '897b72b3-14fc-4e17-98cd-dc940b49d36f', '03c9965e-f232-4a99-9540-c9a41c6f9148', '15ff763f-29f4-4ca5-ae72-b82a10cdf2dd', '5780953a-ea1a-49eb-b8d6-84f7b1053b33']","['gpt2-codegolf__BpenUuM', 'gpt2-codegolf__iyN8P3h', 'gpt2-codegolf__rZjxHGd', 'gpt2-codegolf__eKT5Xpa', 'gpt2-codegolf__4KrBhPH']",0,"[238.689972, 436.186051, 124.154593, 119.737154, 177.836258]","[238.429009, 193.156238, 105.69496, 37.115351, 105.044528]",0.0,False,[] +gpt-5-mini,hf-model-inference,5,"['42850ca1-2721-48a4-9b6b-0f8038c9dc04', '4c648cc5-b1de-4b3b-9bbf-e5f67ad51931', '18603003-dfaa-4b0c-bf90-27e91925acc7', '81b5d0ef-a117-40a7-89b2-feeb63b7af14', 'c03593c0-988e-4682-a474-725c9690b785']","['hf-model-inference__jMcU4Xg', 'hf-model-inference__hX3PTDj', 'hf-model-inference__keVZkTF', 'hf-model-inference__FrJGmTh', 'hf-model-inference__xBB5poN']",4,"[245.669061, 255.82004, 339.060156, 172.569239, 505.853509]","[35.957157, 66.527682, 32.316686, 61.306021, 48.335541]",0.8,True,"['4c648cc5-b1de-4b3b-9bbf-e5f67ad51931', '18603003-dfaa-4b0c-bf90-27e91925acc7', 
'81b5d0ef-a117-40a7-89b2-feeb63b7af14', 'c03593c0-988e-4682-a474-725c9690b785']" +gpt-5-mini,install-klee-minimal,5,"['8309d400-74b4-4c07-9df7-7c5d749202ea', 'e6ca1f78-1b81-496f-8043-b1114189bb1d', 'ed80baff-a9c9-4ae3-8c34-ca917dddbf67', 'ad24cf0d-4b7a-4c92-b132-9e073ff1e419', '78863453-ab9c-49be-96e2-1b4c3270122d']","['install-klee-minimal__jDbEogp', 'install-klee-minimal__SSgVSDs', 'install-klee-minimal__EeK5ihw', 'install-klee-minimal__jAa7pcM', 'install-klee-minimal__DHvWKkR']",0,"[900.035298, 900.615276, 900.000808, 834.16108, 903.03984]","[96.685586, 71.308713, 75.441674, 74.748812, 67.097029]",0.0,False,[] +gpt-5-mini,install-windows-3.11,5,"['3532584f-cbd8-4005-83ae-a72d4331b47d', 'e38e2f6a-fa9c-46ee-8e52-aac36a14d442', '98225b59-8672-4294-acde-adecde6f1714', 'e7f6165f-9db7-434c-ac63-ee63fba32ab9', '1e19fede-14d5-46ad-9041-adf5936b595e']","['install-windows-3.11__rFAr885', 'install-windows-3.11__HYioejG', 'install-windows-3.11__gza7rFL', 'install-windows-3.11__aFG3fCE', 'install-windows-3.11__FUKRuGH']",0,"[366.33384, 348.12997, 1116.303841, 266.145285, 618.915039]","[64.435813, 12.802095, 70.397795, 56.789515, 35.61758]",0.0,False,[] +gpt-5-mini,large-scale-text-editing,5,"['1c09673c-966a-4744-9bfd-040cf0badc26', 'b9e62e60-c9f5-4fbd-9126-92ba8a0de0c6', '8220946e-12f7-4fb8-908e-43039408601e', '84d96793-9bc5-402e-b454-bec71180bfd8', 'e317f8df-d9d0-4d85-ad81-ff38b60a451e']","['large-scale-text-editing__v6uNHBf', 'large-scale-text-editing__4T8zMzK', 'large-scale-text-editing__9xwZ2oh', 'large-scale-text-editing__tjLC8b4', 'large-scale-text-editing__bYJuThT']",1,"[1211.098618, 1208.139785, 146.349982, 1222.926937, 1200.02821]","[90.300434, 102.996453, 40.225996, 14.983364, 24.032667]",0.2,False,['e317f8df-d9d0-4d85-ad81-ff38b60a451e'] +gpt-5-mini,largest-eigenval,5,"['3dab981b-4fff-4807-9f12-01005f0e3517', '3daab2bb-9f6c-4a3f-aae5-96054b8a365c', '5f761415-d533-4866-bc22-f2e2a7ed409b', '0d0bb73f-14e6-46c7-bd37-aefdad3d17ab', 
'75b1b712-5faf-4445-898a-0e9c29bb719b']","['largest-eigenval__aMPmZ4n', 'largest-eigenval__582tBB5', 'largest-eigenval__nrW6pFm', 'largest-eigenval__Nnz3s6w', 'largest-eigenval__63A6ek5']",0,"[919.798709, 950.066419, 924.020696, 900.195707, 902.54655]","[134.280502, 40.693415, 38.025701, 28.753057, 40.887896]",0.0,False,[] +gpt-5-mini,log-summary-date-ranges,5,"['167f9707-2009-463e-aac0-23434c79828a', '9efc1715-dc10-43ab-894c-5760b5bc96f2', 'a4cbeb86-4009-4b86-90d9-4f15d5fe82d9', '69895dee-1d12-4a7a-860d-48edc587ac27', 'df359dc5-3a10-4473-8604-e77d0b4a7213']","['log-summary-date-ranges__SRFRtdY', 'log-summary-date-ranges__gq7UspZ', 'log-summary-date-ranges__fgpNQqJ', 'log-summary-date-ranges__dfHDdi5', 'log-summary-date-ranges__z37YmVz']",0,"[136.758542, 115.511487, 128.262776, 73.332209, 94.414215]","[30.758001, 59.100098, 22.892032, 90.060555, 170.263386]",0.0,False,[] +gpt-5-mini,make-doom-for-mips,5,"['f26b6302-64ae-4827-9819-be33dfdd6614', '17fe88ee-476b-4399-9160-163d1a4d6018', '1030e132-a2cc-4bde-b03e-ea3d8d6ee380', '7ad260af-21cf-4f97-9c8d-962491daeebe', '0d33b75d-e4ab-45c6-8530-08016f44cf24']","['make-doom-for-mips__RbKstcr', 'make-doom-for-mips__bitufEX', 'make-doom-for-mips__TJ85jZ4', 'make-doom-for-mips__Z5Moibm', 'make-doom-for-mips__7bE4vQw']",0,"[908.727245, 906.577662, 902.864994, 903.196624, 915.411897]","[90.976869, 37.870474, 213.308127, 112.17527, 23.358155]",0.0,False,[] +gpt-5-mini,make-mips-interpreter,5,"['a628dc9f-e642-4e48-a358-03e66c2a5d9f', '2800688d-d825-43c9-9584-d6441e64b32a', 'a5b128fd-ae8c-4096-a1d9-652883d27b90', 'db525db7-157f-49e2-bf25-739f60dc2e52', 'cc026822-871a-4d12-b177-572404bf869b']","['make-mips-interpreter__6kNtfzi', 'make-mips-interpreter__WviHnoo', 'make-mips-interpreter__NDAH6kC', 'make-mips-interpreter__UVavDqU', 'make-mips-interpreter__oTJ3GHc']",0,"[1808.065558, 1830.205166, 1801.298598, 1800.005615, 1105.170292]","[112.742323, 27.049152, 31.085021, 57.109366, 27.234246]",0.0,False,[] 
+gpt-5-mini,merge-diff-arc-agi-task,5,"['7eb30c3d-3cca-4767-8f0c-3b5178e84dda', 'd3a6f04d-14e8-4ff4-9dc6-0abd8dfbd2a0', '2fdd2d38-9517-4155-8476-f0f16316c48b', '749c9a3b-f330-423b-b22c-1dce67dfb7a5', 'f2aeee12-653d-43d5-8933-36a440239f2a']","['merge-diff-arc-agi-task__tDxFbCY', 'merge-diff-arc-agi-task__6HgAdyT', 'merge-diff-arc-agi-task__GaW4vWu', 'merge-diff-arc-agi-task__5gATJQF', 'merge-diff-arc-agi-task__DAuY5MR']",2,"[247.340679, 909.820458, 587.371606, 906.533537, 979.610297]","[19.968332, 104.537661, 12.806951, 195.924316, 79.391461]",0.4,False,"['7eb30c3d-3cca-4767-8f0c-3b5178e84dda', '2fdd2d38-9517-4155-8476-f0f16316c48b']" +gpt-5-mini,model-extraction-relu-logits,5,"['86b0af8c-30e0-449b-9cc1-fb379c5a4a64', '666c604c-9a58-454d-9f70-fafdaa8233bc', '6271509b-0b07-4d76-a653-3cc1c187a6d9', 'e434385a-a6fb-47b3-8186-f6955d2df967', 'e223545b-6ae5-4184-9871-d0a4cb936399']","['model-extraction-relu-logits__KZ4NwZw', 'model-extraction-relu-logits__ASEPfaU', 'model-extraction-relu-logits__d3a5HKD', 'model-extraction-relu-logits__7Zx9oxJ', 'model-extraction-relu-logits__5jEb6xs']",0,"[931.484553, 431.490574, 327.181601, 138.091196, 219.411444]","[19.06601, 128.184384, 38.128588, 37.807678, 15.441476]",0.0,False,[] +gpt-5-mini,mteb-leaderboard,5,"['6c0adec2-25b3-484d-9bb6-ab8486aba1fe', '52b01561-521e-4cf5-bf56-e9072b67c238', 'e32f2f33-7357-44c4-bbfd-ffc05f06fc59', '87411c9e-fe61-4e2a-b3a6-bf00a76f97de', 'e77fe3c6-debb-4364-a6c1-1b2ba7e3183b']","['mteb-leaderboard__3H9hand', 'mteb-leaderboard__QyV4LAd', 'mteb-leaderboard__QxbH3pf', 'mteb-leaderboard__XbucArH', 'mteb-leaderboard__FvHGizk']",0,"[3600.507909, 3602.489237, 3608.335784, 271.216223, 3630.417158]","[19.713715, 4.454326, 5.533454, 19.137947, 75.745503]",0.0,False,[] +gpt-5-mini,mteb-retrieve,5,"['0e2711e5-345c-4aaa-8afe-0d6d7c44d441', 'c48b4a1f-c678-4ffd-9789-0f90e13c8252', 'ffa9d467-0c7f-459c-9325-00e41e45acca', '70f05a09-70ae-4d8d-969e-aeee76119580', 
'24cb400d-b6db-4242-9329-4229e85f85ba']","['mteb-retrieve__rxGXZzu', 'mteb-retrieve__da7ZMUh', 'mteb-retrieve__gT22Ug6', 'mteb-retrieve__f8WimBG', 'mteb-retrieve__NBsHdDd']",0,"[290.868252, 369.050504, 196.847309, 628.823794, 412.934795]","[32.392143, 16.638475, 18.669547, 2.307594, 43.144231]",0.0,False,[] +gpt-5-mini,nginx-request-logging,5,"['83043e4e-97ee-4b66-b7c2-c57d6042fef3', '4eed7fe9-f3bc-415e-8e20-47e7d14fec5a', '1054c334-ecb1-4b78-a16a-47f17890bc15', '9bd387da-9efa-4fd7-a3e7-28af561bc6a5', '62a80648-5f1e-4b66-a738-227919c138cf']","['nginx-request-logging__AyNzrcn', 'nginx-request-logging__BNeLLzs', 'nginx-request-logging__8XNgQZw', 'nginx-request-logging__EJJkf4H', 'nginx-request-logging__67tePaD']",2,"[177.985975, 285.525567, 130.411973, 335.965284, 200.33012]","[58.098066, 42.077755, 18.024077, 61.416474, 26.242354]",0.4,False,"['4eed7fe9-f3bc-415e-8e20-47e7d14fec5a', '62a80648-5f1e-4b66-a738-227919c138cf']" +gpt-5-mini,openssl-selfsigned-cert,5,"['36f1367f-d655-41a7-b322-4ea5f1cffa6b', '2167e733-500c-45aa-9997-cad189d45c77', 'ae0c8810-8e4f-496a-9ca7-9e72d8046bb5', 'd839a4cb-e28c-48da-98ef-2b7f389cb7b7', 'ab1cd615-7d12-4d12-9e38-574737f9a20e']","['openssl-selfsigned-cert__srHrFCd', 'openssl-selfsigned-cert__HGD2RYt', 'openssl-selfsigned-cert__vv3qmDn', 'openssl-selfsigned-cert__ocCnzDc', 'openssl-selfsigned-cert__kq6dthk']",4,"[218.155395, 149.276407, 197.233028, 224.869563, 126.935502]","[34.524047, 92.243769, 44.865905, 71.889656, 27.837295]",0.8,True,"['36f1367f-d655-41a7-b322-4ea5f1cffa6b', '2167e733-500c-45aa-9997-cad189d45c77', 'ae0c8810-8e4f-496a-9ca7-9e72d8046bb5', 'd839a4cb-e28c-48da-98ef-2b7f389cb7b7']" +gpt-5-mini,password-recovery,5,"['808cac95-e8ad-44e6-871c-2e0cf4f40e00', 'c12db0fb-59fb-409f-8a42-3e9aa3a207e2', 'f6c2aae5-9a7c-4670-9fcc-51c0a8a8f1f5', '0c0eb696-3be6-4d9e-b476-f1ced16e7bbb', '3f115726-dbd1-4d21-8c8f-2a8352231d72']","['password-recovery__z7VMQaA', 'password-recovery__DV8GXZf', 'password-recovery__5oRbBKg', 
'password-recovery__W6fcvFH', 'password-recovery__YkggkKL']",0,"[909.924695, 915.622287, 900.104368, 900.010141, 1666.523669]","[50.853044, 56.596423, 27.968271, 18.977335, 45.984434]",0.0,False,[] +gpt-5-mini,path-tracing,5,"['ff51f94c-37d8-43ba-8c47-df32a70b6048', '9ea7eb98-e1a0-458a-a270-fae9c246ab5e', '773bcf4d-23c0-458c-967e-6e463509bf6e', 'bba8477f-3e10-4127-b27f-04ab32196270', '8611152e-9f91-407f-8eac-4ecee1ac7911']","['path-tracing__SHN6hXn', 'path-tracing__ZfibSHG', 'path-tracing__PqKBCu4', 'path-tracing__mGZ2t8L', 'path-tracing__6iwWdcC']",0,"[853.573439, 1555.892007, 1100.400333, 1809.692491, 1800.063195]","[86.543789, 97.601047, 15.189155, 28.310998, 33.347009]",0.0,False,[] +gpt-5-mini,path-tracing-reverse,5,"['d1e0f468-3b22-4fbf-8c21-d314570033a4', 'd824c6a6-bce5-4eb8-a196-6c4acb3c226a', '14206059-cb45-4e40-a1b7-b55478198a4a', '001b8ead-4a37-47e4-9737-34ca951949fb', '5e5ed07e-9e6c-4ba0-b3b8-2f2573b48cb7']","['path-tracing-reverse__49HLB2u', 'path-tracing-reverse__FrLdbHr', 'path-tracing-reverse__ERyQp5T', 'path-tracing-reverse__UUtGJ7u', 'path-tracing-reverse__V962YVh']",0,"[1150.946894, 127.758521, 1803.244462, 1810.15497, 1805.006093]","[136.460861, 41.657848, 25.853253, 51.65925, 76.882266]",0.0,False,[] +gpt-5-mini,polyglot-c-py,5,"['106ed985-8563-417a-8917-f243f52bcc20', 'b66f4645-bfb8-45db-969a-bf08859155f2', 'c255282b-22d1-47b2-a359-a4e70e592ee5', '4cb87081-fb52-408f-aae1-0511cff8c314', '1fc05812-b820-4c06-9bb0-81b75658e7b7']","['polyglot-c-py__QqtRFhv', 'polyglot-c-py__EFMqzZB', 'polyglot-c-py__bz3Gwcr', 'polyglot-c-py__UxuuRd4', 'polyglot-c-py__TT4Czxa']",0,"[317.484834, 900.386915, 900.001983, 900.027405, 390.116905]","[32.513102, 42.516618, 22.889422, 14.561053, 47.564746]",0.0,False,[] +gpt-5-mini,polyglot-rust-c,5,"['2e7251cd-ee3a-49ba-b2c0-62d85843a04d', '1da3c988-7d59-4bd8-a49a-6b9381d56684', 'eaef5204-48b0-4172-9113-61aded1ad775', '4754ee4b-a5b3-47a4-a6c6-1dda46b46f68', 
'3d5d2d0f-2e5c-47c9-8ab0-38639b16fb49']","['polyglot-rust-c__dLMQxoE', 'polyglot-rust-c__wpUxFZo', 'polyglot-rust-c__avzwVBE', 'polyglot-rust-c__sr8u5h3', 'polyglot-rust-c__y3krsVy']",0,"[900.035667, 906.995784, 919.401645, 901.168655, 440.595907]","[12.778511, 208.641342, 77.498776, 46.169897, 120.849371]",0.0,False,[] +gpt-5-mini,port-compressor,5,"['2a759ffd-5f67-47c7-919c-fc6037c5ba07', '75b38d80-0150-418a-874c-66d755627a38', '6497829f-8449-4139-94c7-0a2c47b7883a', 'c8c48058-b27c-449a-974e-ea78273028a5', '991c71d4-dd46-4f68-bd3e-ab35eb931a52']","['port-compressor__zitZXTU', 'port-compressor__sB7bEwB', 'port-compressor__qGvBJGQ', 'port-compressor__ypH7UDQ', 'port-compressor__PfV3Mzi']",0,"[3603.732211, 3605.167486, 3618.376007, 3607.063215, 3626.957065]","[42.695066, 75.847768, 62.002053, 135.94303, 88.320308]",0.0,False,[] +gpt-5-mini,prove-plus-comm,5,"['ec738d5b-eda5-4824-94eb-4c266247d441', 'b5ebf97b-c60d-46f7-abd8-9adade242286', 'afbe9715-3b4f-4f04-b8a0-c9eec4bbeba7', 'be95abe5-2741-4e76-9a18-923ab1ee9a25', 'c8adcce5-e091-4495-a5df-1078aa0d4142']","['prove-plus-comm__njjkmTM', 'prove-plus-comm__SNbkU2v', 'prove-plus-comm__PNbYwx7', 'prove-plus-comm__uwUR3Es', 'prove-plus-comm__QJRc2Jd']",3,"[170.22793, 208.739091, 100.040451, 93.581642, 172.618389]","[68.192335, 134.464151, 19.422135, 14.194886, 68.637283]",0.6,True,"['ec738d5b-eda5-4824-94eb-4c266247d441', 'b5ebf97b-c60d-46f7-abd8-9adade242286', 'be95abe5-2741-4e76-9a18-923ab1ee9a25']" +gpt-5-mini,pypi-server,5,"['03b407d8-9886-49cc-b381-7f6043245e47', '5c1ae364-88fd-45f3-8965-aed30240426c', '958caf74-cf6f-4618-99d3-e62e7fe3c368', '1483dd49-f1e9-4678-ae57-58b5c745a2e6', '6d479389-503c-43d7-ac63-bc7b14ccff34']","['pypi-server__A6KcZph', 'pypi-server__VxXEZx6', 'pypi-server__GXngFUx', 'pypi-server__9TRK5BW', 'pypi-server__uBFbYuf']",4,"[245.838615, 122.950557, 159.632302, 195.883431, 145.250695]","[103.533689, 171.64155, 25.071511, 36.247554, 52.867635]",0.8,True,"['03b407d8-9886-49cc-b381-7f6043245e47', 
'5c1ae364-88fd-45f3-8965-aed30240426c', '1483dd49-f1e9-4678-ae57-58b5c745a2e6', '6d479389-503c-43d7-ac63-bc7b14ccff34']" +gpt-5-mini,pytorch-model-cli,5,"['cfb5cedd-b5b0-4924-9646-1a0336e467e6', '5dd26334-3994-44f9-8a89-2301ddbf7ef0', '54403f84-3b58-48c6-909c-010287f2e715', '5c84767c-a92b-4372-96f7-214d4101cb79', 'd9d9cfc4-805c-44ad-adb4-f5f469253c62']","['pytorch-model-cli__aAbxoVe', 'pytorch-model-cli__4UpBnmh', 'pytorch-model-cli__ejD4c8m', 'pytorch-model-cli__VHQZjGP', 'pytorch-model-cli__LiRjRfL']",0,"[181.859916, 91.107201, 124.677858, 178.311842, 264.966923]","[71.508896, 95.873162, 65.451483, 134.142992, 79.132656]",0.0,False,[] +gpt-5-mini,pytorch-model-recovery,5,"['fa540284-c635-43d8-8eb0-e7e180023adc', 'a141156f-5a4b-46e9-b721-5623069e0a11', 'db55bf01-f713-42c4-a6c4-787628b7e419', '23209f71-78f2-4b62-994b-8000a97430c8', '1c5ab240-e32c-48b1-a66a-af9be0cd584d']","['pytorch-model-recovery__qafQutu', 'pytorch-model-recovery__QXwiZRw', 'pytorch-model-recovery__2nBA2mC', 'pytorch-model-recovery__HPrS8EV', 'pytorch-model-recovery__zMEnXW7']",0,"[809.873501, 297.503929, 825.620966, 402.367435, 855.838254]","[51.379534, 59.496172, 54.581608, 13.831032, 57.512892]",0.0,False,[] +gpt-5-mini,qemu-alpine-ssh,5,"['bdfa877a-433c-4afb-a33b-ce1d239fc818', '4607115f-432f-4e0e-bece-d5d02e19497b', '879cef1a-291d-41ff-8e8b-723d9443e3ba', '2ea574ab-99de-4328-b1f0-1ab5cfb797fb', '3c41ab80-d074-481a-b65a-626587d4a050']","['qemu-alpine-ssh__cikJuJL', 'qemu-alpine-ssh__NncR6sW', 'qemu-alpine-ssh__uAcQYuv', 'qemu-alpine-ssh__Ua7WnHb', 'qemu-alpine-ssh__6ozD2s9']",0,"[900.116404, 982.850539, 941.082539, 401.584648, 304.586518]","[9.353925, 13.478103, 12.862614, 22.889168, 15.497805]",0.0,False,[] +gpt-5-mini,qemu-startup,5,"['58af9857-e3f3-47f7-b901-253f35c7eed7', 'c431d136-1735-4b85-bbd2-beded79c9b39', 'f64e8006-7154-4174-a5b1-e8a638325b27', '17466622-3065-468c-8b9a-4c64fbda183b', 'e667f95a-a7d4-4822-a860-c719a3ad8e1d']","['qemu-startup__evs5F5k', 'qemu-startup__BqLXoQK', 
'qemu-startup__5Sy2vWu', 'qemu-startup__rxL8r42', 'qemu-startup__RNrAfq6']",4,"[649.734081, 812.293778, 489.802463, 267.37671, 437.319814]","[8.863418, 3.516766, 30.451074, 16.881587, 7.435812]",0.8,True,"['58af9857-e3f3-47f7-b901-253f35c7eed7', 'c431d136-1735-4b85-bbd2-beded79c9b39', 'f64e8006-7154-4174-a5b1-e8a638325b27', 'e667f95a-a7d4-4822-a860-c719a3ad8e1d']" +gpt-5-mini,regex-log,5,"['3912ab41-b86a-478e-a5af-995eabc2ce0d', 'd4fbfa17-af3b-434f-a6d5-8ab775139c52', 'ad4f1c3e-1869-48f7-87f0-9886d79df776', 'e87af172-92a2-4816-bdc2-d2026892fa9c', '6e732d84-7754-4fd3-9334-2f14417da6c3']","['regex-log__itrDdhH', 'regex-log__Trr3TMg', 'regex-log__HVYH2WX', 'regex-log__gwTzAio', 'regex-log__xYEmqco']",4,"[173.350422, 171.2817, 163.535429, 105.204183, 116.841801]","[106.846252, 25.178794, 35.540097, 157.28424, 263.250885]",0.8,True,"['d4fbfa17-af3b-434f-a6d5-8ab775139c52', 'ad4f1c3e-1869-48f7-87f0-9886d79df776', 'e87af172-92a2-4816-bdc2-d2026892fa9c', '6e732d84-7754-4fd3-9334-2f14417da6c3']" +gpt-5-mini,reshard-c4-data,5,"['5956c3d0-735d-436a-896c-fa99ec7b8f72', 'b7338317-329c-4329-a0a5-92c844ba3ec8', 'dd953812-6179-4c1c-9d14-ed0d9f17605e', 'baa7af25-5148-4ef8-b191-e85a7343bd34', 'c28489cf-9ab3-4f4d-a0c9-518ff98323e7']","['reshard-c4-data__GTnPjU3', 'reshard-c4-data__eZzfRVK', 'reshard-c4-data__RcCdECu', 'reshard-c4-data__uUoJGAZ', 'reshard-c4-data__PyHWZXS']",0,"[486.908328, 784.104237, 200.233277, 763.051196, 301.946198]","[49.3141, 66.942211, 111.121123, 189.890614, 62.920592]",0.0,False,[] +gpt-5-mini,reverse-engineering,5,"['003b211c-0f55-453c-ba5a-1d22b4d3bd96', '97e3683b-adaa-4f8a-87e9-0b43f3566e90', '2c5e55aa-a6b7-41c0-b558-ea35d34dab06', 'c4b5e27a-f695-47a5-9927-a5b079f43212', '01023f31-1cd1-4510-9f53-ae5ce6016211']","['reverse-engineering__acRQmdQ', 'reverse-engineering__jCaVWLc', 'reverse-engineering__Kb5MjF3', 'reverse-engineering__tnrDJFm', 'reverse-engineering__Emc7zr6']",0,"[1800.564711, 2071.097966, 7832.939551, 1800.059452, 1371.185391]","[73.163206, 
13.889842, 21.925515, 18.048645, 38.893149]",0.0,False,[] +gpt-5-mini,run-pdp11-code,5,"['c3b7988a-8d10-436b-8773-043aec47950b', '9f4d21d1-32f3-4b7d-9aa2-6cfff96c74c8', 'f79ce026-eb9b-4345-8080-0e7dacc9bffb', 'ed4dfded-1486-4b8b-85d8-c50e61dbbe0b', '96844e5c-2ba0-4a39-a429-c059b6188e1d']","['run-pdp11-code__DZagfbV', 'run-pdp11-code__EGBBGAM', 'run-pdp11-code__XS8X3Fc', 'run-pdp11-code__N8buH8i', 'run-pdp11-code__LnmVcGf']",0,"[258.077195, 693.143545, 222.067762, 1122.815201, 1028.420196]","[68.298277, 86.927407, 36.155018, 86.370905, 118.896286]",0.0,False,[] +gpt-5-mini,sanitize-git-repo,5,"['735c598a-47dd-4a40-a38b-f6951de5eb81', '8edecf4d-e355-4abd-844f-031f1aabdbe2', '7b644390-94b0-4030-adb6-af2419227c78', '5391de27-0405-427e-b375-f08e4d6bc31c', 'c5916c9e-6a5c-4039-a38b-580fe23ed69e']","['sanitize-git-repo__WieC6Yq', 'sanitize-git-repo__FasCaCQ', 'sanitize-git-repo__EUWHKKh', 'sanitize-git-repo__DQVSr5b', 'sanitize-git-repo__qf5fQgs']",0,"[1002.411864, 207.200411, 900.37908, 255.859868, 900.597739]","[140.286295, 20.816512, 42.816441, 52.475003, 78.025958]",0.0,False,[] +gpt-5-mini,schemelike-metacircular-eval,5,"['b863236d-e4ad-4172-87df-cf19becc41e8', '7952c808-a1db-4615-abcc-af01073c3d7d', '00a50e6c-0380-4a26-a608-9a5f7d36f3bc', 'be6cf86b-4f26-4f55-b971-cf2c087f8727', 'e7b5c0c1-5e6a-4637-a7a6-ca4c7cbfbf5b']","['schemelike-metacircular-eval__76KV49x', 'schemelike-metacircular-eval__8EQj5zj', 'schemelike-metacircular-eval__zuuqbVZ', 'schemelike-metacircular-eval__UuXsky2', 'schemelike-metacircular-eval__eJzoqaH']",0,"[2424.501503, 2400.032071, 2410.55378, 2428.968544, 2413.828432]","[80.423159, 84.855072, 41.129756, 13.103847, 90.968006]",0.0,False,[] +gpt-5-mini,sparql-university,5,"['6085883a-4110-4a6a-ae71-c0ee2b946f65', 'ff2984fe-8406-4aa9-9988-26b6919961fd', 'e6b2a61f-ec42-4867-af51-4563257f6369', 'a9479dd6-30e5-445c-a333-616e0e505c1f', '47ab7c53-5dbb-4629-9b88-49ee1b5ece50']","['sparql-university__Nd7yPuN', 'sparql-university__PpugiW8', 
'sparql-university__tKa2zUw', 'sparql-university__csaRkXe', 'sparql-university__T5wERuf']",0,"[499.63291, 305.642809, 171.778461, 263.766192, 646.661874]","[73.942749, 55.078882, 76.950412, 42.749228, 161.623463]",0.0,False,[] +gpt-5-mini,sqlite-db-truncate,5,"['30b5565a-1a21-4fdf-b65a-68bfe7e2b7e8', '9dbc4e35-7a0c-4fc8-97d6-752f323d4045', 'cc1ef134-4987-46d1-bc2d-2913800c592c', 'a722efb7-642d-4194-9b04-050b6555a778', 'b0d9a714-3594-415d-98b4-a57b2e740f26']","['sqlite-db-truncate__BqTZyUi', 'sqlite-db-truncate__SvTAqgn', 'sqlite-db-truncate__iCKYDVG', 'sqlite-db-truncate__XVLSVJJ', 'sqlite-db-truncate__ARrSk3S']",0,"[473.371433, 338.799654, 68.423957, 308.129346, 277.396603]","[69.766731, 23.073803, 34.294368, 42.420904, 16.028348]",0.0,False,[] +gpt-5-mini,sqlite-with-gcov,5,"['57303bba-1dfd-4066-9e6c-fddc15cebf31', '420d2f38-43a9-4e50-bf8b-06c33d314efc', '393aecfc-6744-4752-9862-b9ee75b6321d', 'e8bf67b0-cf20-4ea3-9fe3-c133bb80eb11', 'a03f6da2-4b7e-491c-9a75-e32c940eb0cc']","['sqlite-with-gcov__h6umDGt', 'sqlite-with-gcov__39misKK', 'sqlite-with-gcov__X63n2Nw', 'sqlite-with-gcov__jxwyxet', 'sqlite-with-gcov__7QzGxHQ']",5,"[299.261982, 608.153945, 244.830021, 509.833187, 179.188808]","[62.645392, 36.565469, 43.059659, 90.825313, 36.175995]",1.0,True,"['57303bba-1dfd-4066-9e6c-fddc15cebf31', '420d2f38-43a9-4e50-bf8b-06c33d314efc', '393aecfc-6744-4752-9862-b9ee75b6321d', 'e8bf67b0-cf20-4ea3-9fe3-c133bb80eb11', 'a03f6da2-4b7e-491c-9a75-e32c940eb0cc']" +gpt-5-mini,torch-tensor-parallelism,5,"['0eeefc2e-c78d-4a36-b887-ca0fc0f0e4f9', 'f0867060-a089-4411-b006-491b8f2c45c0', '0bfd7a2c-b5c7-4d53-b7bf-383e2215e8ff', '19665595-97d4-435b-b595-bcf3f2948477', '47a204fe-4d6d-4bd1-972a-af0702c21f5d']","['torch-tensor-parallelism__vDMhDaz', 'torch-tensor-parallelism__mn3reNs', 'torch-tensor-parallelism__4pWSaS9', 'torch-tensor-parallelism__MycGyin', 'torch-tensor-parallelism__XT5h2n5']",0,"[93.839999, 86.937252, 240.651863, 186.701528, 116.723887]","[65.936561, 46.87759, 57.209021, 
104.582351, 19.445879]",0.0,False,[] +gpt-5-mini,train-fasttext,5,"['1f79a6b8-e72d-48d1-be74-f0fae5d6c03e', '5a891410-2c6b-4a56-9686-78ff09d5baf3', '4781e186-090c-4f11-9287-aa75f1b12340', '881fae9e-c548-4717-acdd-31c16fa7e373', '6bcf674f-bb23-4e8a-8097-7e4e619ee316']","['train-fasttext__vn4QqCg', 'train-fasttext__hAqtsJD', 'train-fasttext__2P3NnCC', 'train-fasttext__W9BgUjF', 'train-fasttext__MdrP7VH']",0,"[3648.149359, 3627.221369, 3606.12247, 3624.579383, 3615.210222]","[23.427869, 47.642571, 38.418924, 32.84351, 34.961033]",0.0,False,[] +gpt-5-mini,tune-mjcf,5,"['197474e1-66e3-4831-bff5-7780c42bce68', '7bfe3c5b-0efa-4113-a9de-8eb82f1bd119', 'b6ca23b6-7f97-4085-9849-9162911f17ac', 'e4304038-2fb4-4b21-9153-7ce10fda6a58', 'd1881caf-a6bf-4f24-b6d6-92e4701c9f2d']","['tune-mjcf__wbfkHzm', 'tune-mjcf__gaSNPQu', 'tune-mjcf__cQFoyCN', 'tune-mjcf__qp9dtvC', 'tune-mjcf__77k94iY']",0,"[945.399334, 900.151864, 924.84925, 900.114155, 908.167712]","[24.235561, 76.580259, 68.102191, 9.806463, 14.825552]",0.0,False,[] +gpt-5-mini,video-processing,5,"['7d78d8a6-db09-474e-8ffa-19759b4d87d4', '2660b19a-84a4-4565-a735-807347fc7c0e', '6c714c28-5c82-47fc-887b-1d7a48ebc385', '2049d7fa-ee61-482a-815c-b65da781924b', '7ce8439a-a147-418c-b2d0-01e121161cb9']","['video-processing__N6UbNTc', 'video-processing__qMtFTfQ', 'video-processing__2VLpBBy', 'video-processing__hxwTcUV', 'video-processing__CuY7SgP']",0,"[143.299369, 288.7109, 251.469578, 217.833027, 238.627674]","[42.767885, 51.999654, 87.022307, 37.206264, 35.61172]",0.0,False,[] +gpt-5-mini,vulnerable-secret,5,"['cf5c2cd8-43c5-416b-a586-96427ffaa0d8', 'b78ba586-46ce-4453-bc32-64c8a4403906', '26777cb4-a28f-463a-a1d1-d98648b3805a', '6ff97d3e-14fe-4934-8945-cc795cf037e3', '696475cc-0591-4ef0-8b6f-21b644a9277a']","['vulnerable-secret__NgzwMTP', 'vulnerable-secret__2N96XiM', 'vulnerable-secret__FETzFR7', 'vulnerable-secret__DGwhhZs', 'vulnerable-secret__SWbPxG8']",2,"[904.657216, 904.559886, 810.772388, 911.579853, 
446.983423]","[25.657871, 72.452098, 8.918145, 54.029205, 66.443999]",0.4,False,"['26777cb4-a28f-463a-a1d1-d98648b3805a', '696475cc-0591-4ef0-8b6f-21b644a9277a']" +gpt-5-mini,wasm-pipeline,5,"['bae9db50-5600-4448-aea3-91ab014cbe7e', '055fa93a-23d9-4288-bddb-ee846c467655', '7a93d903-572d-4a46-a2a5-2f0d113bc701', '52831039-8329-4868-b3f9-9b87fe32e787', 'c858668d-b216-41b7-8947-f09500bf25f7']","['wasm-pipeline__QoxxD9i', 'wasm-pipeline__LD9wcYs', 'wasm-pipeline__cvQJuiL', 'wasm-pipeline__xhMeQ92', 'wasm-pipeline__KpM4GKX']",3,"[318.65126, 322.877102, 911.05486, 474.52876, 140.835801]","[4.520398, 16.11399, 4.42517, 10.907106, 13.608961]",0.6,True,"['bae9db50-5600-4448-aea3-91ab014cbe7e', '055fa93a-23d9-4288-bddb-ee846c467655', '52831039-8329-4868-b3f9-9b87fe32e787']" +gpt-5-mini,winning-avg-corewars,5,"['d9d4c2a0-b05b-47a5-8a87-0c9ae741b314', '7ce97d43-01cf-4953-b4c4-1b74a5c0bc71', '5b0aa2fc-0690-4264-a5cc-c6765b323c32', '92d2235e-1fb7-46aa-8c1c-449e6cca542c', 'dd610535-9494-4088-8663-f97f44054c1b']","['winning-avg-corewars__Kbvbu99', 'winning-avg-corewars__DJv5YZZ', 'winning-avg-corewars__TsHQN69', 'winning-avg-corewars__FraPS5r', 'winning-avg-corewars__BV6h6nR']",0,"[3600.046057, 3889.13686, 3624.57897, 3619.603306, 3607.859696]","[64.499009, 4.848878, 180.106591, 41.729013, 24.991598]",0.0,False,[] +gpt-5-mini,write-compressor,5,"['45b4f001-68c4-4ba2-a015-e81dd85d9ed3', 'ec7e1452-1173-4307-9cc5-a079226c594b', '63abacd9-b87c-477c-9ad5-d18cdbf1ebaf', '93830b35-6659-4631-9344-df06c2c6138c', '59bdc1c2-acd2-4f71-be3a-1c07605eabf0']","['write-compressor__JoYumM7', 'write-compressor__4qf3FUR', 'write-compressor__97kt7k5', 'write-compressor__KBnAgdN', 'write-compressor__SMSsJjW']",0,"[272.563807, 200.739629, 793.427209, 902.392981, 111.409613]","[41.204548, 19.270107, 43.611572, 80.034516, 27.967901]",0.0,False,[] +gpt-5-nano,adaptive-rejection-sampler,5,"['a303cc65-3e71-4a94-b4d6-59f9ca84cec7', 'd412527e-84c7-460b-8524-d501c01f142b', 
'bbee7837-49da-4fba-be76-0fcd667ea4b9', '0bad16b2-12e7-4559-8263-1f5a1bb08fce', 'ce940096-d8c0-403b-9396-592a8fac5261']","['adaptive-rejection-sampler__qXDFkwz', 'adaptive-rejection-sampler__VGur2ZQ', 'adaptive-rejection-sampler__38UJ97f', 'adaptive-rejection-sampler__qnjr4iZ', 'adaptive-rejection-sampler__zXfdj2E']",1,"[818.893071, 902.897538, 900.491184, 332.455199, 901.720344]","[137.686176, 79.602128, 43.999761, 75.731599, 57.232212]",0.2,False,['a303cc65-3e71-4a94-b4d6-59f9ca84cec7'] +gpt-5-nano,bn-fit-modify,5,"['0fde5abe-52f2-40d9-ab14-cf9c19ae97e1', 'fc5b3318-05be-4b14-a2da-dc0bf1354ea1', '1ca213e3-36ef-40ee-8a6b-56961e985a7a', '59691d87-6fbe-43f6-830a-d285dc5fcfb6', '4ea250c0-8e1e-461c-a791-9a56a095bedb']","['bn-fit-modify__SgeSKJ5', 'bn-fit-modify__MN3mHJY', 'bn-fit-modify__vhobSAv', 'bn-fit-modify__JjNHAGP', 'bn-fit-modify__vbnEcqw']",0,"[542.463067, 3637.301526, 918.295451, 385.591483, 479.923244]","[83.871491, 70.459368, 28.534253, 271.673549, 228.630744]",0.0,False,[] +gpt-5-nano,break-filter-js-from-html,5,"['327bde72-5b7b-4893-969e-35afdda9ad37', '54795e28-9d40-49a7-b026-4e457999adf4', 'f36374c1-4cc5-4fdd-83d8-b731374dedcd', '3300c18c-ecca-4ad4-9967-1669897be8ee', '41f87aee-0fc6-46ac-ab22-e27d65a7d3d3']","['break-filter-js-from-html__dUf2HYE', 'break-filter-js-from-html__RnRZyTw', 'break-filter-js-from-html__x64Qnz9', 'break-filter-js-from-html__4PNwsnY', 'break-filter-js-from-html__4zdSNoq']",0,"[1200.074658, 1213.599301, 1214.065029, 1254.933754, 1200.937706]","[78.351177, 100.667928, 55.736499, 163.546765, 11.673694]",0.0,False,[] +gpt-5-nano,build-cython-ext,5,"['ee6c422e-845d-4fc0-baef-bc302c0d2430', '12e96ba6-7a79-49b8-b4ce-d963f3473624', '835a0073-3d85-44db-87d2-4f72b5ff4bfe', '3ef19d39-df32-499c-a71c-2ee8e6e194f9', '17383441-63c8-4da8-b4b7-4dacc9972b22']","['build-cython-ext__fwy3yhb', 'build-cython-ext__gdNLvpj', 'build-cython-ext__fdWfV7F', 'build-cython-ext__Q573BYD', 'build-cython-ext__xzxGTfA']",0,"[904.101111, 922.466644, 919.813052, 
911.589764, 960.328104]","[134.925099, 32.086984, 79.123766, 74.222473, 36.325552]",0.0,False,[] +gpt-5-nano,build-initramfs-qemu,5,"['ff385be5-f800-4056-8b58-f3ea781588b1', '30ccf8f0-c600-42fd-9a20-bea5aa38dd30', '15a973d3-6470-4dcd-ac6a-5a624c94980d', '2260edc0-cc3b-4806-8f25-aa0efdb85130', '7531ff46-7cd9-48f4-83ad-f49a225e5d54']","['build-initramfs-qemu__s37vWsW', 'build-initramfs-qemu__Vu9qLM4', 'build-initramfs-qemu__LapL5Pj', 'build-initramfs-qemu__cVf8tiv', 'build-initramfs-qemu__Wvtonzh']",0,"[900.007355, 914.449687, 902.49105, 96.907217, 914.555972]","[93.090863, 91.254061, 43.595826, 116.787544, 12.176184]",0.0,False,[] +gpt-5-nano,build-pmars,5,"['c3712e0c-b40a-44b2-8f96-38127fc70fca', '7bc5b685-774e-4fe3-bced-e123d29063d3', 'ff39606e-04a5-4885-8ff8-e1b53c5a91c4', '60ee2b95-9ee2-489a-b2ea-828a924a1dba', '577ae939-0eb6-4bcd-b343-fe80131ef274']","['build-pmars__YZEgPgU', 'build-pmars__B3C2PjX', 'build-pmars__ZRxHhxX', 'build-pmars__XeHaDPi', 'build-pmars__4ojp8Qo']",0,"[914.867195, 933.897896, 936.566649, 910.247932, 917.995153]","[10.0119, 15.392677, 103.717317, 7.95142, 5.196139]",0.0,False,[] +gpt-5-nano,build-pov-ray,5,"['2be63c7d-cac6-46a2-82cc-a5a745dc700c', '0d3715ad-cb91-4565-b152-20ba83aaa584', 'b9a2fb57-47d2-434c-a42e-445d31204299', 'bc26752e-5bdf-4bd7-bf2b-52cd3235f7a7', 'fb8ca50c-6998-4f57-bcd8-9fac190b5d7f']","['build-pov-ray__pAGv3WW', 'build-pov-ray__JhEdZFt', 'build-pov-ray__wkumhJD', 'build-pov-ray__Kh9bcoY', 'build-pov-ray__zjdCuKY']",0,"[6000.001924, 6385.659199, 6019.158278, 349.746264, 6004.218408]","[35.900768, 91.764258, 43.510135, 28.023101, 93.601488]",0.0,False,[] +gpt-5-nano,cancel-async-tasks,5,"['990c5dd9-1fd5-478d-91c0-0c15e695b74a', '826c11b1-3bf1-44e8-8e86-c44d87d8f23e', '4f557590-e84d-4199-82cb-3e8532328147', '7c1417e5-2e14-406e-8c63-dfa2066aeb6b', '00d6acb4-b0c3-4921-92a9-a79e3ae67325']","['cancel-async-tasks__voScWFL', 'cancel-async-tasks__vSjEScM', 'cancel-async-tasks__rumaDuJ', 'cancel-async-tasks__Z2w8xgS', 
'cancel-async-tasks__myPnmu7']",2,"[460.080179, 1802.185056, 664.885121, 100.905734, 722.041626]","[337.602864, 39.904457, 111.374991, 37.527767, 86.035617]",0.4,False,"['7c1417e5-2e14-406e-8c63-dfa2066aeb6b', '00d6acb4-b0c3-4921-92a9-a79e3ae67325']" +gpt-5-nano,chess-best-move,5,"['db491ae0-036a-49f5-bb19-7c77938c054f', '2142963b-efa7-41e0-9d18-74da4e6db6d7', '2c7c7e86-cf68-4505-9e2d-5ff42416f989', '0d6b6088-f877-4903-8e6b-f4f206e33b0e', '2bd7a599-7fc6-40b9-8a6e-7248ce4fe12b']","['chess-best-move__GiaKWAb', 'chess-best-move__Xyr5Bxg', 'chess-best-move__i9FEM42', 'chess-best-move__LY5pjyg', 'chess-best-move__rxq8BDi']",0,"[900.808594, 92.702976, 901.766858, 534.169005, 901.981711]","[66.286623, 13.401048, 6.644036, 262.800842, 40.265048]",0.0,False,[] +gpt-5-nano,circuit-fibsqrt,5,"['e4b67a7c-7e5c-4904-8cbc-42b2922466da', '81b85d40-cdde-40be-93cb-d604afde25f9', '2457a5ae-6abe-4ca0-95b7-09a0d1082d10', '718354f9-1540-47bb-a84e-afad16a8902d', 'a3d50e87-de59-4380-864a-d6635e8262eb']","['circuit-fibsqrt__QZ9tbSR', 'circuit-fibsqrt__BFKCpBQ', 'circuit-fibsqrt__zA4AqMh', 'circuit-fibsqrt__h2C9qgx', 'circuit-fibsqrt__YRQDjAy']",0,"[3602.854599, 294.273455, 388.051787, 3606.240286, 3607.975236]","[26.696347, 38.612786, 57.086311, 76.23015, 21.254732]",0.0,False,[] +gpt-5-nano,cobol-modernization,5,"['99769767-447e-456d-a1a3-54952767b535', 'ed573b9e-4911-4c60-b655-0a1ae0c8be72', '498aeac8-5ec1-4bf3-84d1-49ea13ff1c24', '1cd8ad5e-b8a6-4758-8387-ff734e24ed01', '95140eb3-87a4-43f4-b332-e72e7853bee7']","['cobol-modernization__gbtRQZa', 'cobol-modernization__YJ2LbHY', 'cobol-modernization__MrqSbiu', 'cobol-modernization__pdhcxok', 'cobol-modernization__tH5HB7c']",2,"[902.784781, 915.022057, 906.29711, 900.012195, 901.324885]","[58.723793, 54.451211, 12.405641, 16.792434, 82.888817]",0.4,False,"['ed573b9e-4911-4c60-b655-0a1ae0c8be72', '1cd8ad5e-b8a6-4758-8387-ff734e24ed01']" +gpt-5-nano,code-from-image,5,"['4670eee4-4547-481a-bd56-f3653ad4dcc3', 
'835ca73b-5497-444b-9c4d-54011f0f99ca', '3347e82c-2042-4df9-a32b-95dda8fd3ed5', '49807970-2d2e-430d-af9d-6ac04e0cc593', '75393222-87a2-44ca-bd50-1ff1d800d81f']","['code-from-image__Eyp7Drz', 'code-from-image__r9nKEbm', 'code-from-image__dd29fB9', 'code-from-image__MjWnaa6', 'code-from-image__DYXU3wV']",0,"[1222.466232, 153.95484, 1184.555332, 69.547031, 56.311326]","[66.561235, 50.91546, 79.324945, 129.736684, 25.131137]",0.0,False,[] +gpt-5-nano,configure-git-webserver,5,"['a3204fe4-ff67-4c04-b964-451940607141', '3e4cb9a3-00ac-4868-b084-b8f2871e4cde', '4ca825b3-c639-4fe1-afe9-6d2989d64e9e', 'fab04615-c0e9-49be-83c7-677317673e0c', '20fc7cb0-8454-4ba0-a77a-157fb48e2dce']","['configure-git-webserver__X56sHAQ', 'configure-git-webserver__4Umf3Uq', 'configure-git-webserver__Ek5RUyC', 'configure-git-webserver__P8JqApB', 'configure-git-webserver__Eop8AMp']",1,"[900.73465, 329.591897, 904.343931, 548.32542, 364.123252]","[44.479643, 39.753012, 34.891923, 27.275753, 154.905071]",0.2,False,['4ca825b3-c639-4fe1-afe9-6d2989d64e9e'] +gpt-5-nano,constraints-scheduling,5,"['fc2922a6-caf1-43be-9431-10eba3aac8b7', '53551a68-9fd5-4e9c-baf4-c65cc45331a1', '11ece640-c17f-4af1-88bf-20f086da909f', '56f9b237-5bc6-43eb-86c5-9ed3dc3003ec', 'a72ef5f7-7d68-4082-a673-434f60ae3107']","['constraints-scheduling__vp39fXy', 'constraints-scheduling__U7XUboy', 'constraints-scheduling__FRwWfZD', 'constraints-scheduling__DxhjBGU', 'constraints-scheduling__JzH4vB9']",2,"[1200.008872, 184.273481, 828.407854, 395.72651, 227.173906]","[109.034317, 24.471325, 217.289901, 74.229798, 61.322347]",0.4,False,"['11ece640-c17f-4af1-88bf-20f086da909f', 'a72ef5f7-7d68-4082-a673-434f60ae3107']" +gpt-5-nano,count-dataset-tokens,5,"['7137e1ff-6000-414f-a5f6-cfd1125be95a', '053bb4d5-419c-493c-8d7b-974a4ff377e2', 'b6ef5f8f-7e31-4183-b93a-0bd1823cad74', 'b6210482-43ce-4deb-b079-6a454fb2009e', '3a829fcb-6d95-440f-a000-9974dc4829f9']","['count-dataset-tokens__7NwA5oR', 'count-dataset-tokens__grZkVEk', 
'count-dataset-tokens__h4uDByR', 'count-dataset-tokens__karyExk', 'count-dataset-tokens__KvYcuBM']",0,"[925.964914, 900.696784, 907.084235, 904.839144, 907.80398]","[53.130197, 8.732161, 56.208427, 43.965044, 24.728799]",0.0,False,[] +gpt-5-nano,crack-7z-hash,5,"['23bfc685-cbb6-4c5c-b82e-bc461cb3aa8f', '1adf4074-c319-4dd8-90cf-634436a52465', 'a7a908e7-31e2-40e0-aa16-d2a86f9dfcc2', 'e6b7f583-3355-41c2-9414-dcfe10720c51', '1af73754-908d-48a5-8f4d-670dad2c377b']","['crack-7z-hash__euH6Yss', 'crack-7z-hash__VqyLi8t', 'crack-7z-hash__gBU4cP7', 'crack-7z-hash__q6NQdmJ', 'crack-7z-hash__2VNQjhs']",0,"[64.506897, 256.013581, 492.663071, 171.686959, 68.582114]","[56.598805, 50.068922, 14.469331, 10.80913, 17.168868]",0.0,False,[] +gpt-5-nano,db-wal-recovery,5,"['6cd1a883-1863-4e38-a56b-4ea43bd653cb', '0abb0c24-8bb1-4527-ad5a-49d17b2c644d', '9c6dd741-2410-4197-a925-044d060d9720', 'a904a358-9444-48b2-9eba-1f11512c38e3', '7da5b938-c498-4939-8818-e00a125d6cdf']","['db-wal-recovery__A4LALCh', 'db-wal-recovery__3NMNZBh', 'db-wal-recovery__X2ZMFj9', 'db-wal-recovery__xgSSAKR', 'db-wal-recovery__9fXPcSu']",0,"[906.782637, 205.118138, 911.419391, 1029.392734, 927.362762]","[23.752168, 10.261984, 35.518634, 33.020635, 50.651688]",0.0,False,[] +gpt-5-nano,distribution-search,4,"['17fc11cb-44ae-467b-b3f5-70f6356768d6', 'dbafd7d3-b05a-4122-a6eb-4aff4f5429bb', '73817b8e-be63-4f2b-8f38-fae064fee451', 'e0bff138-ed86-4280-af1f-9878992d0fd8']","['distribution-search__FXzbZAc', 'distribution-search__CQoGwDf', 'distribution-search__VJkmjzE', 'distribution-search__FKWn6WX']",1,"[3605.859821, 1625.734429, 3623.688132, 3346.798907]","[49.761326, 13.779635, 32.685024, 156.217475]",0.25,False,['dbafd7d3-b05a-4122-a6eb-4aff4f5429bb'] +gpt-5-nano,dna-assembly,5,"['0d6e0e62-c526-4ab5-aea5-c940724e5ed5', '53aff598-a8bc-4185-9886-e7358a8e4855', 'bbd20cd8-d85d-4209-aa0e-7f903574c031', '41a0673e-5b36-478a-8531-e20d17c277e3', '0bd08ad3-9ba8-432e-b6f5-49acfedc5930']","['dna-assembly__8DSrtzo', 
'dna-assembly__EZwV5vJ', 'dna-assembly__bzWdq5G', 'dna-assembly__XMDvsS6', 'dna-assembly__bzduUDW']",0,"[763.386427, 720.48179, 749.742164, 777.270451, 726.593836]","[47.386939, 108.11111, 38.062341, 62.907129, 37.266134]",0.0,False,[] +gpt-5-nano,dna-insert,5,"['7ee4a787-9089-44a9-a2b5-36d1ef3de55b', '6046336b-df29-46ae-b9c8-e05953dbc3a5', 'e0197869-c39e-46de-9997-f166d5f72c42', 'b640f0d1-80dd-433e-a775-a32107ab13d4', '3ae940eb-4526-43c7-8ae0-64992c03d6e2']","['dna-insert__nA5bZ3n', 'dna-insert__REMxtTz', 'dna-insert__f9miGwM', 'dna-insert__AtBPHTT', 'dna-insert__onEjgYK']",0,"[360.376733, 377.771084, 262.533636, 367.3831, 365.536655]","[314.445466, 31.075986, 22.823325, 82.432496, 36.638198]",0.0,False,[] +gpt-5-nano,extract-elf,5,"['d3180dfd-7a50-456c-bba9-b4a5cdbf8dca', '289122a3-a0f6-4e6c-a79e-b5606784f55c', '682a1d0f-6c73-418b-9ccb-91c68c9c52ee', 'f5e368ff-0c49-4219-8bce-bf96656ec774', '53057808-b2b1-4c79-b74e-8f5d347f9681']","['extract-elf__dQC6kPA', 'extract-elf__48ubrMx', 'extract-elf__CbYgTeZ', 'extract-elf__MVfncej', 'extract-elf__DgiasJa']",1,"[562.913072, 900.607172, 272.078997, 144.633765, 794.774017]","[185.020625, 112.861971, 40.692187, 31.855138, 39.140182]",0.2,False,['53057808-b2b1-4c79-b74e-8f5d347f9681'] +gpt-5-nano,feal-differential-cryptanalysis,5,"['f52f0682-0868-4a95-b8d3-993e5b0193d6', '68680041-9cba-41e2-9c3f-dd96b88b2d5f', '6d607abd-05fd-4082-b28a-1135da5b0691', '02ae6604-753c-4223-9a00-e37ef33b9b7e', '6bde58e3-f9f7-43e5-aec1-c40e9777c281']","['feal-differential-cryptanalysis__WZG67NL', 'feal-differential-cryptanalysis__tHc94Xc', 'feal-differential-cryptanalysis__AJWm3Xp', 'feal-differential-cryptanalysis__kBxxMcU', 'feal-differential-cryptanalysis__NmybV4g']",0,"[287.896496, 1803.213401, 657.022342, 656.719255, 98.026569]","[10.703465, 82.554957, 248.119638, 41.937767, 60.368581]",0.0,False,[] +gpt-5-nano,feal-linear-cryptanalysis,5,"['7c3f8538-4107-41eb-925b-c9bccea0e5a2', 'b6f560d3-deaa-4f3a-b992-31d217167d50', 
'3eec3656-5c4c-47e3-9fe3-06c9173dde87', '9ac5dae9-28fe-4097-a195-b100e6eeff70', '422b814f-151b-4462-8cef-51b3e31e6772']","['feal-linear-cryptanalysis__LWjHZg2', 'feal-linear-cryptanalysis__iHa8v8s', 'feal-linear-cryptanalysis__26k8MfZ', 'feal-linear-cryptanalysis__t3UytMz', 'feal-linear-cryptanalysis__H6BTeXg']",0,"[1800.110598, 1801.367497, 1801.069087, 1814.425211, 1801.318975]","[108.602773, 66.730305, 20.968674, 14.802508, 81.240702]",0.0,False,[] +gpt-5-nano,filter-js-from-html,5,"['61d5f61b-b128-4458-a7ec-7feb734a3ecb', '0c0067e5-be3d-4c9a-b1fd-7beaf3e13183', '35b5fddf-7745-455a-a57a-503f7f61e8f1', 'efac70da-c352-4c81-bd24-539ad85b4ac4', '59851ada-2785-4dd3-9a66-b68ee935e8ce']","['filter-js-from-html__p7cD6Cn', 'filter-js-from-html__UW2qLH5', 'filter-js-from-html__Ro7ser8', 'filter-js-from-html__VWnYWUw', 'filter-js-from-html__7ffv6uY']",0,"[901.618909, 676.114883, 123.623545, 407.989321, 176.890287]","[23.49958, 78.022613, 32.3418, 33.119769, 131.721562]",0.0,False,[] +gpt-5-nano,financial-document-processor,5,"['f47bbcd0-0dc1-4b82-a0c9-f589ed8a8e5e', '55f435f7-9ef3-47f7-b0a7-eabab131c186', 'd68797a9-d08b-4030-b2ee-2ff60b01fe06', 'd714136b-c860-4e04-9679-f00f0b6db4c0', 'aac3df65-1bf8-4494-82b7-f5f75aee8695']","['financial-document-processor__BbXK2XQ', 'financial-document-processor__huNWGau', 'financial-document-processor__fpM5eQm', 'financial-document-processor__j2xUUNQ', 'financial-document-processor__iZMGjBp']",0,"[1225.38529, 761.460402, 1200.602162, 1202.752336, 1200.108211]","[292.572407, 21.339335, 39.412825, 146.980919, 34.52988]",0.0,False,[] +gpt-5-nano,fix-code-vulnerability,5,"['09dc4105-c9fc-49da-8959-27c1e147259b', '69cd9f98-6da5-4c76-ad99-d47dabe2afcf', '5e080ce5-9c64-4547-965d-d696d130cdff', '49e7cfda-6d56-4511-bf5f-7745371f2f09', '98e7d43f-3346-484b-95af-e4f918ce8f56']","['fix-code-vulnerability__y7rwtGh', 'fix-code-vulnerability__PHoPuPp', 'fix-code-vulnerability__HTKDqEf', 'fix-code-vulnerability__jQySPeH', 
'fix-code-vulnerability__R4jmGUx']",1,"[941.852106, 901.082412, 482.756827, 487.895402, 907.712192]","[11.656371, 75.900789, 27.625839, 45.508529, 25.140437]",0.2,False,['5e080ce5-9c64-4547-965d-d696d130cdff'] +gpt-5-nano,fix-git,5,"['97d75b2a-29f8-4ef3-8335-d46a62c03d36', '41972ba3-40f1-401f-8e1b-9b1f30d968ee', '3b1899c8-d1de-4339-8075-b83647c72bca', '3de7e646-8d0e-4e5d-b101-8fe9ed95c696', 'a5e689c1-171d-413d-8c92-bef40f6ae730']","['fix-git__rm5mSDA', 'fix-git__en3V8oT', 'fix-git__CUPRo35', 'fix-git__sfDuCwa', 'fix-git__cnhCc6k']",0,"[900.000949, 914.106193, 944.405087, 161.950019, 900.491035]","[67.792615, 25.628736, 32.41048, 39.792231, 27.393882]",0.0,False,[] +gpt-5-nano,fix-ocaml-gc,5,"['673c7816-af07-49bf-ad7e-10c18faa8a22', 'c69c8afe-4980-46eb-a46d-13aefce461a8', 'b3060adf-9e7a-49e8-9cdb-255d0a55824e', 'ed62e705-c932-4025-88d1-62b3c072d761', '9cc9746f-d489-4cef-895b-fd574f6efe79']","['fix-ocaml-gc__hxdQ24V', 'fix-ocaml-gc__vqy9dPS', 'fix-ocaml-gc__mM7Zdfd', 'fix-ocaml-gc__hwAPua2', 'fix-ocaml-gc__6QySpQd']",0,"[3609.446217, 3602.946318, 3605.157478, 3636.301606, 3754.157715]","[81.436061, 230.150204, 60.177807, 32.905947, 16.613593]",0.0,False,[] +gpt-5-nano,form-filling,5,"['9bbd4c87-46d0-4cbe-bdfc-e74e312bc832', '7e9b0249-63a0-4493-b28a-b435613bb6df', 'ee0e0171-41f4-4a7b-bdab-d19d1cb6fd0b', '77a76ef4-1645-4147-ab67-54cf6e6b9164', '461e5645-b536-46ca-ae64-54915d481555']","['form-filling__EsRvgPw', 'form-filling__gcE76Eu', 'form-filling__jfiAYAz', 'form-filling__ueNBkGw', 'form-filling__tvtNnyt']",3,"[256.983497, 907.71556, 900.243668, 416.223106, 900.001958]","[9.929134, 61.797626, 18.689936, 63.142766, 4.720854]",0.6,True,"['9bbd4c87-46d0-4cbe-bdfc-e74e312bc832', 'ee0e0171-41f4-4a7b-bdab-d19d1cb6fd0b', '77a76ef4-1645-4147-ab67-54cf6e6b9164']" +gpt-5-nano,git-leak-recovery,5,"['3c480d88-4a55-44b1-af7d-46492ec5566e', 'cc1766a1-f6e5-47c5-95b1-7bb245917dda', '0142a589-2275-40dc-83ef-e50cd901e96b', 'b7c1c784-0825-45ea-b9b7-ea5f5cdef6ad', 
'bffcb8b2-e1a3-4c0e-85ef-ed3107738cb0']","['git-leak-recovery__6w5ezGU', 'git-leak-recovery__aWUq6zn', 'git-leak-recovery__TvjkMTZ', 'git-leak-recovery__dfk2Jjo', 'git-leak-recovery__nU6BNxF']",0,"[458.77393, 902.702985, 904.121029, 901.068127, 601.066027]","[24.936984, 55.064919, 18.217005, 71.682049, 44.841613]",0.0,False,[] +gpt-5-nano,gpt2-codegolf,5,"['c16559a9-59ee-481d-b510-788461242ac5', '10dfff30-00b3-43d0-a2c2-c2cad7fb6bb0', 'fa1b68d9-d614-45d9-8ebf-f3a21725b8d9', '8d3adc34-f187-4fd7-b340-af9148621a19', '7ad021cf-1982-4b5d-b60f-b91981a835b0']","['gpt2-codegolf__thwHU4y', 'gpt2-codegolf__ZHNHTyC', 'gpt2-codegolf__XFiNw42', 'gpt2-codegolf__MLAqdmY', 'gpt2-codegolf__wEYtM2h']",0,"[900.018413, 901.495722, 900.768369, 102.798116, 949.044162]","[219.060269, 193.215395, 103.544034, 25.613981, 57.401584]",0.0,False,[] +gpt-5-nano,hf-model-inference,5,"['970ca86b-aafb-48bd-a7ce-bc3ec4588332', '5642bbdb-5db2-4b69-b0d0-15460143bda9', '98091376-b51e-4e89-9202-c1f81028fef5', '038bb50c-ccdc-4445-b3de-9dd8fc634fb8', 'c780b22d-8449-4cdc-a780-497bb698fcdd']","['hf-model-inference__gx9683m', 'hf-model-inference__2SXEQv6', 'hf-model-inference__jWY5idP', 'hf-model-inference__tZHuPLB', 'hf-model-inference__9u4qDgc']",2,"[900.225072, 355.19306, 902.801198, 919.773131, 908.559964]","[50.265115, 65.704146, 61.980139, 55.032067, 31.828349]",0.4,False,"['5642bbdb-5db2-4b69-b0d0-15460143bda9', 'c780b22d-8449-4cdc-a780-497bb698fcdd']" +gpt-5-nano,install-klee-minimal,5,"['629b43e9-8e89-4f34-9004-6784580e5a67', '64ce5bed-560f-46fb-bc68-cea7f9de44e9', '855c43de-db94-4716-bd16-447df015a462', '6f7e81f4-2106-46ce-a146-1117b652b5b9', '0860a3c3-5625-49d1-90f8-dc9995c12d79']","['install-klee-minimal__RdMjtKm', 'install-klee-minimal__CY2dNCj', 'install-klee-minimal__34Mp393', 'install-klee-minimal__87QXnYC', 'install-klee-minimal__RyQvTLe']",0,"[900.000366, 900.045389, 908.930039, 906.13521, 904.415734]","[126.511244, 91.397976, 111.532395, 53.4906, 65.683912]",0.0,False,[] 
+gpt-5-nano,install-windows-3.11,5,"['9d56ce29-ed76-4b8d-930f-13bc9f52d980', '0e457e46-8c98-4bb5-b194-afdf0341ec38', '4dd404b1-9531-4591-bc85-7365e9d1cf32', '10c38cce-7071-45e3-986f-353c400687c3', '4866015e-5bef-43d0-8438-ab03733d0827']","['install-windows-3.11__y9Kuy8H', 'install-windows-3.11__xW9VqX3', 'install-windows-3.11__ZTYs4n4', 'install-windows-3.11__bgqH3fc', 'install-windows-3.11__YVwW6dK']",0,"[3690.493455, 3603.047322, 3627.529185, 3607.163798, 3602.906463]","[123.026224, 57.357771, 74.106206, 63.929858, 45.483278]",0.0,False,[] +gpt-5-nano,large-scale-text-editing,5,"['d9d92238-1c00-4e5f-9338-75bf9c7b971d', '8b85ef64-6d93-4709-8389-ae308d21f572', '4623c750-29fe-439d-9da3-5e054c4f4487', 'f6c10a37-d9b6-4bec-94ab-62199b043b44', 'cfd431b1-27ad-4425-9d64-2a9bf2fe1dd7']","['large-scale-text-editing__pszrnLc', 'large-scale-text-editing__4SDMSqZ', 'large-scale-text-editing__EoLATii', 'large-scale-text-editing__XLY65rY', 'large-scale-text-editing__AfL7Dxd']",0,"[1200.415566, 1201.750252, 1219.124585, 1203.651723, 1202.879457]","[14.856641, 35.59247, 21.220816, 146.697001, 97.308247]",0.0,False,[] +gpt-5-nano,largest-eigenval,5,"['f382387a-f40c-4c84-a149-9b29cd49a982', '93dab8c0-ef8d-4c05-afc1-05172496bc0d', '06a5b16c-5f7c-4c70-88b4-f0f359cad74f', 'b5995c9d-2352-41c7-b551-3aef028555e1', '8bbcd39e-a612-430e-8ceb-b9625fe25c1c']","['largest-eigenval__NJiicK5', 'largest-eigenval__Py95mN8', 'largest-eigenval__6QELdgj', 'largest-eigenval__FYUsRyv', 'largest-eigenval__EJk2HPm']",0,"[962.463437, 900.132336, 364.138481, 179.300111, 901.424654]","[353.371833, 88.372926, 37.126459, 69.630562, 55.091421]",0.0,False,[] +gpt-5-nano,log-summary-date-ranges,5,"['34fdaf91-a5c2-4665-b2e2-4ccdc1bdb96b', '8e1c2727-a184-4e68-ba6e-58e6a218776b', '64f73997-df8d-400d-8979-30263167536a', '2b338aec-06df-42c4-83ca-9331c028f363', 'ca89ec53-ac5b-4b58-a815-b2ef8c7acc64']","['log-summary-date-ranges__jEFRgQc', 'log-summary-date-ranges__DuqHy4f', 'log-summary-date-ranges__jRFemeP', 
'log-summary-date-ranges__B4bnidx', 'log-summary-date-ranges__4imijev']",0,"[210.414753, 160.143288, 270.259882, 909.398653, 569.005703]","[35.568965, 58.628973, 78.04667, 20.898206, 170.330511]",0.0,False,[] +gpt-5-nano,make-doom-for-mips,5,"['e90fcddf-fe64-4f44-b12e-d9e9cfd3f3ff', '165cb0e9-b188-4aea-a751-3c7fda1f7a96', 'f2f0e62a-53d6-46e4-8079-18e35b7275b0', 'e8e31986-ae94-4e34-81af-91c0c82aa908', 'ee4d7c74-c247-4ff3-9e0d-8cadcfe5fa99']","['make-doom-for-mips__SN9Xofo', 'make-doom-for-mips__Whvpn3x', 'make-doom-for-mips__UM8gtYV', 'make-doom-for-mips__RV5QYi3', 'make-doom-for-mips__AHgHyNV']",0,"[901.505165, 914.385128, 908.780469, 916.42802, 912.645415]","[214.121554, 23.922208, 48.366434, 160.332211, 64.973788]",0.0,False,[] +gpt-5-nano,make-mips-interpreter,5,"['65fe6f82-b3f0-449f-82da-6f921c417aac', '7ae47306-bb3e-4241-99b7-6f18db50f9ba', '3419b2e9-3ed1-4023-a468-6727a860e5c1', 'f3a3ad4b-e2cb-40a7-ae48-f7108907aa2d', '6658a3e1-aceb-463c-bf12-ce4e697d9b2f']","['make-mips-interpreter__QFgJovf', 'make-mips-interpreter__Z866Rpw', 'make-mips-interpreter__bmbm6e9', 'make-mips-interpreter__q227euw', 'make-mips-interpreter__zMw6BYc']",0,"[1805.38438, 1806.515231, 1804.836996, 1807.654461, 1814.332045]","[127.785937, 65.200409, 36.764687, 111.918515, 51.350861]",0.0,False,[] +gpt-5-nano,merge-diff-arc-agi-task,5,"['02188842-7988-46c0-9b17-aa49ad59b165', 'fde69992-1800-47c4-9d93-91cf2c32cc66', '327ce27f-451c-41c8-af2e-5d9e53a71ae3', 'c0073804-2144-4929-84d3-328610350b0f', '81e72b55-e7d9-4231-975e-f88995ed20bb']","['merge-diff-arc-agi-task__NkPif2P', 'merge-diff-arc-agi-task__dVma57k', 'merge-diff-arc-agi-task__8hxeAGK', 'merge-diff-arc-agi-task__gB2YKst', 'merge-diff-arc-agi-task__4x7B8uJ']",1,"[454.908975, 503.875515, 900.947232, 587.703042, 517.514929]","[21.30923, 19.473718, 215.889313, 67.053352, 59.550437]",0.2,False,['02188842-7988-46c0-9b17-aa49ad59b165'] +gpt-5-nano,model-extraction-relu-logits,5,"['e4702c73-23fe-4201-82fe-620d5476ae24', 
'9b5f79b7-4cae-46fe-af17-9089d001ff9a', 'fb125afa-5585-418f-ab83-032d673b27e7', '6b73e5ba-8a2c-4ee2-984e-1dd88b92edd1', '84e09410-005e-4e47-97d7-8030f323b93c']","['model-extraction-relu-logits__4s39v6A', 'model-extraction-relu-logits__4sY5xx5', 'model-extraction-relu-logits__tgvQoGz', 'model-extraction-relu-logits__BRtUAMt', 'model-extraction-relu-logits__6vHtwxM']",0,"[281.321433, 175.789692, 179.623617, 136.355575, 82.519475]","[9.172811, 15.463658, 56.700956, 24.515249, 29.621255]",0.0,False,[] +gpt-5-nano,mteb-leaderboard,5,"['1054b191-da06-4c38-ae19-80558f15013d', '4e4777b1-039c-4424-b2ac-9ce9766f3318', '696ff5d1-b026-4504-a0e2-f6202d0f75d3', 'a6c234d0-7f6e-4d6e-8bf6-5597ad03552d', 'bf5c4722-0681-4a25-9e99-117934b010eb']","['mteb-leaderboard__5E8b8zA', 'mteb-leaderboard__abDPc65', 'mteb-leaderboard__KKY4Pgc', 'mteb-leaderboard__CZbn59E', 'mteb-leaderboard__sacnY3a']",0,"[1732.246102, 3602.432102, 3600.029678, 3630.082023, 1937.702894]","[14.344208, 5.22135, 20.638589, 4.26335, 13.587451]",0.0,False,[] +gpt-5-nano,mteb-retrieve,5,"['8ca72de2-e04c-4965-9955-fb7e9255a194', 'bb47de03-a41f-40bd-8987-b98c7c77e614', '9c3f8abf-d5d2-4983-9ca7-877008d5ec55', 'a54a7151-0004-4aa8-b5cc-9f0706a355cd', 'edcf76a3-f793-47af-88e8-9c384dbd5c26']","['mteb-retrieve__tUWbtcm', 'mteb-retrieve__yaEdbqm', 'mteb-retrieve__YxMo3Xg', 'mteb-retrieve__y3NPFii', 'mteb-retrieve__JzBXhH7']",0,"[1875.76028, 499.205285, 1818.220261, 309.128176, 661.036411]","[6.440081, 103.658655, 155.622303, 13.01281, 6.609595]",0.0,False,[] +gpt-5-nano,nginx-request-logging,5,"['77dbb26b-f9e8-4986-a7c6-b5a082d9434b', '680d091d-b56f-4390-ae80-3093fd2f9848', 'c3fdf7a2-5574-4425-a528-fbecb571513f', '6d544b26-fd7d-4ef4-8682-50666e5bb0fe', '70dbedd7-20e1-40bf-bda0-aaa50480231b']","['nginx-request-logging__u2qHY7M', 'nginx-request-logging__L3BkJva', 'nginx-request-logging__68LqrU5', 'nginx-request-logging__dAsMuHK', 'nginx-request-logging__xJJ6Kuj']",0,"[949.775719, 364.983412, 900.624736, 900.667918, 
1024.089891]","[58.964165, 66.59209, 85.344756, 49.833166, 26.499578]",0.0,False,[] +gpt-5-nano,openssl-selfsigned-cert,5,"['80be214b-0f04-4ee2-9316-7635e4fa5b4b', 'c38caa6f-3413-41de-a0cc-32b74ba3df61', '46146ca3-5f7a-4caa-bb8d-47b4c5c578e9', '6626d907-53dc-493f-a9d5-1c26a5a909a7', '688961b2-6e1b-4b48-a3a4-a8fef9ac0a97']","['openssl-selfsigned-cert__oj2Ffyy', 'openssl-selfsigned-cert__QMXehoo', 'openssl-selfsigned-cert__ZjRJwpN', 'openssl-selfsigned-cert__HGcRvCo', 'openssl-selfsigned-cert__PDtSmRY']",3,"[904.478958, 631.43602, 292.403505, 907.278233, 111.455464]","[78.413402, 45.907458, 54.044038, 69.24579, 27.672617]",0.6,True,"['c38caa6f-3413-41de-a0cc-32b74ba3df61', '46146ca3-5f7a-4caa-bb8d-47b4c5c578e9', '688961b2-6e1b-4b48-a3a4-a8fef9ac0a97']" +gpt-5-nano,password-recovery,5,"['39245809-5dc6-43dc-8f46-22354480c47c', '30bdcb90-bc1d-4a29-9096-19acace470b1', '7ac78740-c58b-4094-9c33-f21ac74c901c', 'a171470f-6272-4e3d-b8f3-9dbff056014a', 'd593c474-e661-4e82-b792-3f9d10ba32e7']","['password-recovery__YTgaPVh', 'password-recovery__XH58Noe', 'password-recovery__c2dNndq', 'password-recovery__kjuy6Vv', 'password-recovery__3W4dHvA']",0,"[900.719173, 1666.422786, 904.616632, 906.166665, 913.197578]","[20.445888, 44.3351, 42.484131, 16.930823, 73.050932]",0.0,False,[] +gpt-5-nano,path-tracing,5,"['9c26cd4c-dec9-40b5-8ef6-93a5b6d08c0b', '2e51ad5d-5c3a-4d14-8926-48ae06a8c5b3', 'e5471318-1caa-40f6-a2b5-12e33bb82412', '8aec5210-c091-43e9-b017-443c52659ff9', '621655c2-b7af-40db-a72e-cb970121a00a']","['path-tracing__dYFiVX9', 'path-tracing__syukYue', 'path-tracing__uG2XDpg', 'path-tracing__CokLQhC', 'path-tracing__DAKvoz8']",1,"[1800.037215, 233.00758, 175.308208, 1810.486239, 198.459098]","[13.869916, 22.055946, 85.591261, 52.895138, 93.71186]",0.2,False,['9c26cd4c-dec9-40b5-8ef6-93a5b6d08c0b'] +gpt-5-nano,path-tracing-reverse,5,"['e972881c-6cea-4ec9-b84d-837fc49c8a5a', '0ec63e4d-e64b-4faf-905e-11f4429ba99a', 'c348ce81-3e52-4f5d-a78e-a9afecac119f', 
'ca928ae5-9635-4af4-907e-c3cdc9f0e2f4', '440d0bb1-dfbd-4ade-8eac-44e30c4882be']","['path-tracing-reverse__dqJtbdZ', 'path-tracing-reverse__6V3mqgX', 'path-tracing-reverse__G3Xk8Q7', 'path-tracing-reverse__ddC2eHr', 'path-tracing-reverse__uvkm65N']",0,"[136.947874, 197.725017, 1835.192355, 277.176631, 206.151477]","[71.751, 27.762015, 44.100424, 90.437366, 133.289303]",0.0,False,[] +gpt-5-nano,polyglot-c-py,5,"['50335ce8-c241-4552-932f-270ce3c2edf6', '45d38a12-2f53-4e66-899d-f533b5abcc7b', '97ec64aa-2fcb-4bb7-953e-23a611902e4b', 'dc7b00c1-2147-4661-80c8-e69303f139c9', 'c4ff3e74-a8c1-42a2-9c4a-fdcd281ae138']","['polyglot-c-py__V7JX5K9', 'polyglot-c-py__nWfjazp', 'polyglot-c-py__BWivZzs', 'polyglot-c-py__qi6zLxj', 'polyglot-c-py__mF8rkA2']",0,"[900.234927, 254.236836, 900.141671, 595.425073, 963.991313]","[18.601157, 40.066066, 22.913337, 21.288558, 48.527259]",0.0,False,[] +gpt-5-nano,polyglot-rust-c,5,"['e258f068-1643-497f-ab31-bbfdfa81ce10', 'a32840b5-36e0-4886-8b60-2037a03aa1c8', '2df9a216-4d5e-4759-87b5-4bd5fbbbbd0f', 'b5633c60-56d3-4f50-b097-4d8f6daaaab6', '2962dabc-034a-46bd-bf05-ff32266dae34']","['polyglot-rust-c__sn3zYWG', 'polyglot-rust-c__AbYXmHy', 'polyglot-rust-c__ACUbDtS', 'polyglot-rust-c__HwnMzE9', 'polyglot-rust-c__Txoma6x']",0,"[308.956451, 905.077738, 252.606981, 900.140924, 566.271415]","[76.148557, 32.574352, 77.889956, 147.171377, 25.577537]",0.0,False,[] +gpt-5-nano,port-compressor,5,"['e1e39383-bdb7-4ee7-beaa-ac30ab3fb79d', 'e144c3ee-6855-4f5b-ba63-d5d340cecfdc', '1f2e4859-5af4-4c45-b5fc-c47a1e1d7805', '161963d5-cb87-4201-b53c-d2f404212cf6', 'ccd9e1fa-a7ba-4fa0-aa1e-a71b76611493']","['port-compressor__ksCaKQS', 'port-compressor__rDdHCFp', 'port-compressor__oabz7FY', 'port-compressor__Nr3WxZM', 'port-compressor__vbmm9Vo']",0,"[3605.16392, 3611.691835, 3611.687095, 3618.307337, 3624.441471]","[75.821205, 35.064604, 131.756165, 61.510354, 89.832871]",0.0,False,[] +gpt-5-nano,prove-plus-comm,5,"['0537cba9-14d9-426b-accc-b07c2542ec08', 
'ff8cb9a5-0d28-43d6-856f-30f8acede506', 'b91e580b-5594-4a12-b0ad-2d56402df695', 'edba987e-f279-4308-824a-27050f2e10c4', 'e9a8641f-ecd3-412c-995e-4d3eb69c96bb']","['prove-plus-comm__QLZQmRY', 'prove-plus-comm__25x55Xk', 'prove-plus-comm__EfbtRHy', 'prove-plus-comm__cG9Ga8m', 'prove-plus-comm__Gz2TiBL']",2,"[291.844602, 900.001055, 393.440593, 900.023277, 905.307202]","[133.897335, 19.711799, 27.508151, 68.154503, 88.506395]",0.4,False,"['0537cba9-14d9-426b-accc-b07c2542ec08', 'b91e580b-5594-4a12-b0ad-2d56402df695']" +gpt-5-nano,pypi-server,5,"['6bbed1dc-90b6-49e1-b51b-9421dd2357a7', '34477d7e-073b-4318-be0e-a3bd68463ff8', 'fcc48f6a-b8e3-470d-a3a8-e81424264169', 'e76f8a22-4753-4a60-a71e-88e90d1a56c4', '95bddb5a-2652-4efd-9591-97f7b3514602']","['pypi-server__SVidBxE', 'pypi-server__iJQsJEp', 'pypi-server__NG3Q9MQ', 'pypi-server__BbS9HkL', 'pypi-server__LY9zirN']",4,"[153.238482, 689.40874, 422.243813, 393.226204, 761.841603]","[221.748391, 37.933902, 58.656173, 101.585712, 35.696333]",0.8,True,"['6bbed1dc-90b6-49e1-b51b-9421dd2357a7', 'fcc48f6a-b8e3-470d-a3a8-e81424264169', 'e76f8a22-4753-4a60-a71e-88e90d1a56c4', '95bddb5a-2652-4efd-9591-97f7b3514602']" +gpt-5-nano,pytorch-model-cli,5,"['0af69304-388b-4d13-9bb5-5c4c68dc7e7a', '7a594bb1-d629-4dfb-988a-5438205bb1b1', '698521b5-5662-4dd0-a19c-d26b80bb331c', 'b2a74ab0-ebb0-4e5d-a07a-2797d666e93c', 'd950ea69-fb26-4f9d-952e-438aaad28903']","['pytorch-model-cli__aPg8M7A', 'pytorch-model-cli__cTyMs3k', 'pytorch-model-cli__GhwUrGG', 'pytorch-model-cli__Monrytt', 'pytorch-model-cli__NRu3Xg7']",0,"[268.352405, 237.045804, 259.063906, 397.23751, 228.27177]","[88.783945, 90.552549, 682.697742, 78.860996, 66.092121]",0.0,False,[] +gpt-5-nano,pytorch-model-recovery,5,"['493ad8a8-e41a-4ce8-963a-9c55de766bb9', '3f228cc5-63d7-4967-89ec-e7900164b9fa', '0672684b-ebda-4e1d-acc5-52d9e356988e', 'e7375bf0-2717-40e4-a96f-fda52d20e679', 'e9996573-f61f-4367-ac8f-bf03cbd6f27e']","['pytorch-model-recovery__c6XhCmi', 
'pytorch-model-recovery__ohbiH6h', 'pytorch-model-recovery__8znk5pE', 'pytorch-model-recovery__dWh8tur', 'pytorch-model-recovery__gE5jEWq']",0,"[872.056794, 903.244122, 900.016947, 909.594941, 900.822114]","[59.183923, 53.682841, 60.379743, 115.5091, 24.597713]",0.0,False,[] +gpt-5-nano,qemu-alpine-ssh,5,"['6ef1dad1-d823-42e5-a1e3-117d483db278', 'f9f68cdd-0841-42d5-9e3e-d98afcbd13a7', '98b8eb3e-c817-4dc4-866b-a13c87499d34', 'e635faf0-4425-491c-bb67-c68b6c4e2a3f', '7c9c2355-4935-4171-addf-d64d8b29ba6a']","['qemu-alpine-ssh__wSmpEL8', 'qemu-alpine-ssh__Saxh58z', 'qemu-alpine-ssh__cx8gLYL', 'qemu-alpine-ssh__B8Uhakt', 'qemu-alpine-ssh__2yRsvx9']",0,"[921.555876, 902.626363, 963.531137, 900.117622, 958.775217]","[74.642899, 10.722509, 18.389077, 9.51599, 10.00116]",0.0,False,[] +gpt-5-nano,qemu-startup,5,"['96fcd209-7c8e-4aeb-bf4f-e338ed706b7e', '62525c68-1e86-4fdb-ba64-af72b9852e38', 'a8681aad-3ca2-47af-b5de-071081dd86d2', 'cf0ad0f1-34fe-4b91-9ff7-b224629be63c', 'fd21b178-e94e-457e-843d-0fa650c40962']","['qemu-startup__5oxXxTY', 'qemu-startup__PQ53yCe', 'qemu-startup__rDoKSGm', 'qemu-startup__SzCPi2k', 'qemu-startup__3YXfB7p']",0,"[900.068942, 903.429558, 900.401521, 900.477429, 1018.652489]","[9.609038, 3.565991, 43.608103, 15.201265, 108.452161]",0.0,False,[] +gpt-5-nano,regex-log,5,"['133cf151-a73c-4e37-b206-1a1ebef24c8a', 'fc3994c7-1b37-4348-a627-386c2c3e9cf1', 'dedfc082-a80d-4c5c-89af-924c1e36c9f3', 'c9ec3100-e9e8-44d8-ae46-2e5bc7dfb6af', '1a8b49d3-d115-4794-966b-0b697e0022db']","['regex-log__UnyFziT', 'regex-log__tqwWNfR', 'regex-log__oJzJ3Z5', 'regex-log__ugh4Cui', 'regex-log__EJ9JWtw']",1,"[764.706026, 900.00096, 905.945441, 2352.316519, 449.711529]","[150.725566, 208.465253, 32.512404, 180.473659, 30.93433]",0.2,False,['1a8b49d3-d115-4794-966b-0b697e0022db'] +gpt-5-nano,reshard-c4-data,5,"['376f51b0-482f-4d72-a54a-489420db51cd', 'd4cb8f39-4bdd-4041-b050-b84e1a24326a', 'bf0c9adf-fc31-477b-b11d-4a636e50cc38', '43fd16c4-d907-46a8-90cf-7c75e1323de9', 
'13248c77-6e02-40db-85af-dd677750d2a6']","['reshard-c4-data__N69WnHa', 'reshard-c4-data__PhKaDsg', 'reshard-c4-data__mLvPtM6', 'reshard-c4-data__fZ3ecFT', 'reshard-c4-data__3Kqwksj']",0,"[1684.60652, 341.528637, 488.023741, 454.477631, 900.162178]","[45.860974, 111.079536, 23.832204, 178.274831, 100.240504]",0.0,False,[] +gpt-5-nano,reverse-engineering,5,"['b6f91ed2-0f3d-426b-b2be-5913bcc21bb9', 'cc16e299-1e99-4e4c-9fff-506d05a1f9f8', 'ad2eb0e5-ef69-4731-acff-d21a23053218', '513b7b5c-cc32-4c6a-9a1e-0f995451893c', '390ea97a-778b-41ea-bb44-c524dc8df9d7']","['reverse-engineering__yS6WYdo', 'reverse-engineering__BuDKV6S', 'reverse-engineering__r2wwW3u', 'reverse-engineering__WBFEaQ8', 'reverse-engineering__AoszQ2x']",0,"[1830.366763, 1803.798913, 1827.004584, 1803.218777, 1801.412052]","[13.713853, 42.899427, 85.57079, 7.320691, 79.888227]",0.0,False,[] +gpt-5-nano,run-pdp11-code,5,"['83f1cb26-954b-4f4e-a648-7e09fd2f6e7f', '2b7ca9e1-3e0b-4255-8e8d-1d94ad09ef83', '397aac9a-b375-4a5e-83ad-2d4fbb006123', 'e58c2f42-5754-4b2b-8790-18fca6a2c789', '18d0b7c5-7172-467c-aeb8-dde4158cc41d']","['run-pdp11-code__NTdgZPu', 'run-pdp11-code__N9oDwyF', 'run-pdp11-code__PiUc77f', 'run-pdp11-code__ghwFg2f', 'run-pdp11-code__icjZfAk']",0,"[1021.511765, 1037.246064, 1000.023488, 1004.027911, 1005.871915]","[121.913552, 306.647338, 47.945604, 64.127699, 40.256]",0.0,False,[] +gpt-5-nano,sanitize-git-repo,5,"['f09e523d-0fd0-45c2-b101-c1a8ef503cf2', '5a203e45-b3c1-4c5e-a44c-968966050856', 'a4d1244e-5523-47f6-bdb3-9105806e6822', '3c935d1f-0e21-4915-a0f0-c864c86cc4ff', '97b9c356-a088-49e4-8679-f381cf237400']","['sanitize-git-repo__7KtLqif', 'sanitize-git-repo__tmKVyhR', 'sanitize-git-repo__o4QTJ5p', 'sanitize-git-repo__mhL7xMg', 'sanitize-git-repo__NkqtaPR']",0,"[924.750022, 900.283965, 902.627943, 405.671443, 908.925051]","[29.143158, 33.804276, 37.100204, 12.599637, 27.8439]",0.0,False,[] +gpt-5-nano,schemelike-metacircular-eval,5,"['ced38a76-1968-480c-9637-281d55b77a49', 
'4d28bf30-11b5-4523-8dc5-b37242f17efb', 'a62b93c8-943a-4e5d-8172-6feea1c1b309', '14b76156-e9d7-499a-bf38-fab27278a18e', '7ec6ec4c-0d5a-4260-977b-0c0dc8e7f983']","['schemelike-metacircular-eval__gHjoCMK', 'schemelike-metacircular-eval__EiWnM4r', 'schemelike-metacircular-eval__F8WvxyF', 'schemelike-metacircular-eval__feumVDA', 'schemelike-metacircular-eval__RjvpzkH']",1,"[2464.685159, 2411.539425, 2407.831533, 2401.299745, 254.080905]","[89.467904, 45.771447, 120.41469, 24.628754, 84.320935]",0.2,False,['ced38a76-1968-480c-9637-281d55b77a49'] +gpt-5-nano,sparql-university,5,"['f2032e58-77e6-40c7-95f0-2a63dbfe0eb2', 'b42b8e90-2dd3-412e-8d4b-452f43d9cd23', '835a120d-c9f8-4aae-b3f5-4782d58e004c', 'b0949005-d326-4368-bb29-5a4d5498bd7d', '9be7fb66-cc9d-43ee-b38a-6691c6ba27b0']","['sparql-university__GDCZSvy', 'sparql-university__9bpQzSC', 'sparql-university__fvqnATu', 'sparql-university__hFpZMRP', 'sparql-university__QMJTmaT']",0,"[907.096685, 908.425454, 923.192472, 103.284168, 933.821437]","[29.441514, 48.412181, 62.284153, 47.955859, 199.373061]",0.0,False,[] +gpt-5-nano,sqlite-db-truncate,5,"['b74023c2-0b20-451f-be53-7d2f0a7fc85d', '3b395af5-5331-46a1-a1ff-12a74bf2941e', 'c03d7a65-331c-4eff-bc96-f7303af5fca0', '4f236017-9f74-4364-81f7-7d15610c8391', '2f0ede3d-11aa-4de1-acef-e9c6adbb2d8a']","['sqlite-db-truncate__CZajf3B', 'sqlite-db-truncate__cy47BQC', 'sqlite-db-truncate__TrE3UES', 'sqlite-db-truncate__U6HnpxN', 'sqlite-db-truncate__ZrMAfN6']",0,"[904.584648, 308.390938, 900.049675, 907.407995, 566.002901]","[25.421632, 20.320564, 34.211853, 14.338999, 68.638223]",0.0,False,[] +gpt-5-nano,sqlite-with-gcov,5,"['a503c32b-3e8a-4d0f-9b42-dd7690124e76', '659a64cf-6cec-461d-be27-ba80f0230a3c', '3155d64f-1f4f-47c9-af01-b40e8f88f552', 'be43eefc-bb79-400a-800b-f91bac6bacdf', 'ed886b6a-946b-46f9-9e0f-56ad3c34a40b']","['sqlite-with-gcov__z7bxrvH', 'sqlite-with-gcov__ukUwNE6', 'sqlite-with-gcov__5SDkWGu', 'sqlite-with-gcov__rUDVxHq', 'sqlite-with-gcov__x5LzdxZ']",3,"[276.664172, 
900.019909, 108.302722, 430.979574, 849.763498]","[42.556573, 46.86445, 36.363819, 41.211548, 33.628601]",0.6,True,"['a503c32b-3e8a-4d0f-9b42-dd7690124e76', 'be43eefc-bb79-400a-800b-f91bac6bacdf', 'ed886b6a-946b-46f9-9e0f-56ad3c34a40b']" +gpt-5-nano,torch-tensor-parallelism,5,"['efabd1eb-d108-4305-b8c1-ff9c54aca96c', '72538fad-95e1-44a5-82e5-0f0f6aebabbc', '5542b648-ca61-4a74-a236-8d32a5aeff5c', '7b6aef11-1000-4cef-824d-997cc749602d', 'b6921fc8-ba73-4754-a4bd-7e9b8c4c6252']","['torch-tensor-parallelism__djHnVAN', 'torch-tensor-parallelism__gzKyM6u', 'torch-tensor-parallelism__SQo9xd2', 'torch-tensor-parallelism__TQSRkJ3', 'torch-tensor-parallelism__LChtWid']",0,"[174.734081, 914.847544, 908.130843, 900.284344, 900.235168]","[36.151945, 18.999688, 62.49365, 100.595814, 47.411699]",0.0,False,[] +gpt-5-nano,train-fasttext,5,"['36635844-4c1b-4cf2-a891-30393acca1bc', 'da7071eb-7ea6-4e09-84e8-f6172fdd7a44', 'ba168e96-63f1-4d45-8f31-f41704d52b2b', '83552a4c-811c-4cef-b811-775616315075', 'ca3e0e83-4752-4c7c-8503-480d17fd56f6']","['train-fasttext__5hDYpr3', 'train-fasttext__kVe3ATn', 'train-fasttext__Z6rPDVS', 'train-fasttext__opDzVhz', 'train-fasttext__ERaXSJ3']",0,"[3600.692619, 3606.066432, 3603.687584, 3600.000437, 3647.866614]","[29.265173, 172.389943, 40.06923, 44.415026, 23.759746]",0.0,False,[] +gpt-5-nano,tune-mjcf,5,"['9ea1759f-a0f0-4248-9bcf-110e46e1d0e4', '4e9beb73-864a-45bd-91ab-fd5dbfce7627', '804df6d1-a32d-4a0b-a2c9-47338efebf93', 'be5762e7-756b-44df-a6fc-b975203b3131', 'bb0f568e-46fb-43a2-acf1-687610120f15']","['tune-mjcf__R7xrbzA', 'tune-mjcf__KATaEmq', 'tune-mjcf__vhULcoU', 'tune-mjcf__Qnjvuz4', 'tune-mjcf__qyrMoQx']",0,"[995.823158, 928.837663, 906.288846, 900.168726, 907.992166]","[65.912738, 33.940453, 24.470822, 10.038576, 15.572368]",0.0,False,[] +gpt-5-nano,video-processing,5,"['5e54f47e-bc87-4b9b-850d-83ff8aeb9e35', 'e8409ebe-6b1d-44d2-8bdf-d656c602f96e', 'ca764b9d-cd5e-4566-8e75-4d1075a4ac13', '70c6ce54-bfdb-4778-a3ee-2417ccebd570', 
'c1de1b39-aca2-4d3f-b6e3-fff00b000e42']","['video-processing__NwfSW8N', 'video-processing__yUETUva', 'video-processing__9bpGvGA', 'video-processing__5xCAVDn', 'video-processing__YBh24hX']",0,"[138.784426, 138.731875, 273.32696, 145.175298, 125.773703]","[87.617388, 15.359664, 26.989172, 54.362225, 41.166143]",0.0,False,[] +gpt-5-nano,vulnerable-secret,5,"['880441ee-3aec-43a7-baf3-293c25ad9eea', 'f4299ba2-0bce-4100-8ec2-e682b85c30a2', '2116a837-169f-4d29-a5de-5211a5320707', 'c27036eb-23fc-40ce-a313-7a0fc794c843', '2d67f129-52e9-4c6a-8c0c-4f75f2ad4a50']","['vulnerable-secret__d9CEgX7', 'vulnerable-secret__TkcqHV3', 'vulnerable-secret__2ue85SN', 'vulnerable-secret__V7ojYbc', 'vulnerable-secret__DiyDUTf']",1,"[908.780874, 924.125589, 433.439086, 901.541733, 900.014226]","[90.241067, 13.083653, 22.902204, 18.4719, 9.152352]",0.2,False,['2116a837-169f-4d29-a5de-5211a5320707'] +gpt-5-nano,wasm-pipeline,5,"['9158073a-b01f-4bb3-b142-92498bcedcf8', '2ebf77d2-5ed9-47fe-b2f7-11ce9c4ffbc2', '71bf0f3c-ca18-454d-8ce7-106abe7e4ba9', 'a3404e18-f6b0-4207-bd75-0b9a2b98dce9', '9cb6db34-45e0-46be-b714-9a1b092c6ac6']","['wasm-pipeline__cAri6kf', 'wasm-pipeline__EpnDiyR', 'wasm-pipeline__dBrtf38', 'wasm-pipeline__HMNDsHT', 'wasm-pipeline__d3QjaY2']",0,"[906.744493, 938.986527, 910.489231, 902.398994, 912.719245]","[5.200794, 4.141474, 7.119983, 7.820365, 18.651275]",0.0,False,[] +gpt-5-nano,winning-avg-corewars,5,"['7467a2c2-8077-430d-a09e-21efbd2ae18c', '7b38922e-e1ea-4ce6-b06f-18b800884fe5', '6a93b939-3388-45eb-98d3-dc8e5e85a20f', '4b634c45-a1f4-4ab2-abd9-997754f63ec4', '8b84f7b9-c687-4450-b541-f728a4c46c39']","['winning-avg-corewars__aCJHqab', 'winning-avg-corewars__jVNSHdr', 'winning-avg-corewars__MsZYAkG', 'winning-avg-corewars__69jkFCU', 'winning-avg-corewars__G7tj6gV']",0,"[3629.853352, 3618.29844, 3618.360888, 3635.756976, 3609.666848]","[4.249909, 57.927897, 83.343403, 20.923098, 22.528442]",0.0,False,[] +gpt-5-nano,write-compressor,5,"['9d0b3277-b385-4924-8e40-bc9cb12e5ede', 
'dcf0bfc4-fcd7-43f0-933d-6ec7de023f13', 'bca32fb4-5f4a-41fe-8de0-1e7b9508cee5', 'ed818932-8618-4b31-8753-c3eaadd6f6c8', '2861ea76-0488-4961-8258-ce153dd2c063']","['write-compressor__ceuLhG9', 'write-compressor__BUGvsmw', 'write-compressor__WK2SosT', 'write-compressor__gorcUa3', 'write-compressor__b7YNQ7D']",0,"[907.399624, 903.472232, 908.091282, 900.240016, 284.346443]","[45.484612, 80.367529, 153.248479, 43.997086, 48.513102]",0.0,False,[] +grok-4-0709,adaptive-rejection-sampler,5,"['00b1bab2-2ddb-409b-881d-96e44d4a6b59', 'a22b5c78-9c16-47cb-a16c-e934b5b17471', 'b6d8e351-37b1-4d5e-9141-6ad8945ad922', 'f5dae9b2-744e-4e6c-a873-872b5acbf278', 'fa5dad9c-0b43-465b-9fe6-3386e332def0']","['adaptive-rejection-sampler__3yFBvXg', 'adaptive-rejection-sampler__wK8bb36', 'adaptive-rejection-sampler__3pqfEa2', 'adaptive-rejection-sampler__L2LcSUD', 'adaptive-rejection-sampler__KdQD3YR']",0,"[931.346731, 661.345924, 900.161335, 906.756728, 902.628289]","[332.886544, 41.7219, 75.863891, 25.896889, 74.600856]",0.0,False,[] +grok-4-0709,bn-fit-modify,5,"['696069f5-30cb-4cec-a4a2-4c8e8658bd45', '798bee1c-abcc-48de-a764-383c2b54fc1a', 'b1ac6ea8-a88a-44f7-8a57-694326aea6cb', 'c0807dc8-ca09-4521-aefe-851e5f7b66ba', '55130153-64f3-4944-b1d7-811b02dbb23f']","['bn-fit-modify__f6tpV8c', 'bn-fit-modify__jFpy2M2', 'bn-fit-modify__XtLSRFg', 'bn-fit-modify__3zpgjqz', 'bn-fit-modify__fBu9eSt']",3,"[2622.69476, 2074.064092, 1895.533263, 3038.932611, 1829.417233]","[82.167968, 261.143466, 93.21949, 15.102587, 322.097892]",0.6,True,"['798bee1c-abcc-48de-a764-383c2b54fc1a', 'c0807dc8-ca09-4521-aefe-851e5f7b66ba', '55130153-64f3-4944-b1d7-811b02dbb23f']" +grok-4-0709,break-filter-js-from-html,5,"['1706e640-86f8-4cad-b7b2-4022e2d9e903', 'cea19262-85af-4737-b330-9a2005df59da', 'ebd41487-ff39-4a5c-bedc-c0ed11fd5334', '747858f2-7163-4aa8-ab35-9107d5fac434', '97ceaa3e-d5e3-4f47-ad94-42c699e3be23']","['break-filter-js-from-html__LMCzFb4', 'break-filter-js-from-html__rscWRbj', 
'break-filter-js-from-html__tf4uoFm', 'break-filter-js-from-html__U4jKq4A', 'break-filter-js-from-html__e3j824h']",0,"[1212.536861, 1210.270347, 1200.099427, 1218.204018, 1200.040302]","[71.942703, 26.62191, 81.768342, 10.055971, 115.247883]",0.0,False,[] +grok-4-0709,build-cython-ext,5,"['b7a8dd81-2bf7-4193-b386-25cac1ee1d96', 'e9a5541d-2044-482b-8a7d-30debd7e6eba', 'dba4d961-5275-4b10-8f2e-c025a6d4c7bc', '6970fc53-2bee-4320-86ac-3b03800b481c', '76cf5a03-9456-4a71-b06e-325f103b3fd9']","['build-cython-ext__c7g2Ybt', 'build-cython-ext__if4KKvo', 'build-cython-ext__veEHtrR', 'build-cython-ext__y9CbhXL', 'build-cython-ext__goWCgEt']",0,"[900.3513, 904.099153, 910.697525, 919.754113, 900.017413]","[12.261046, 49.335577, 12.423724, 68.753046, 146.810235]",0.0,False,[] +grok-4-0709,build-initramfs-qemu,4,"['c8a589b7-1969-40cb-8acd-4a92970a856d', '8580107b-763a-48a6-9d83-973fd4fbb276', 'b5bf16ef-04e8-4633-8603-da2d849920e5', '1160389f-7de8-4a58-ab22-0fe95209e81b']","['build-initramfs-qemu__Vi5RFVZ', 'build-initramfs-qemu__bm8otR3', 'build-initramfs-qemu__EczCTJM', 'build-initramfs-qemu__63R9SvP']",0,"[913.24577, 900.0023, 900.00104, 954.757592]","[93.420197, 10.802765, 34.409105, 289.337469]",0.0,False,[] +grok-4-0709,build-pmars,5,"['4424ef95-e7a5-4ef2-8bfd-a277a0257087', '1a6b4329-8863-402a-b411-4774d0a93382', 'd5595a8e-5357-4d81-b28e-773ef9c34798', 'd04d7ced-13f7-42f0-b5ff-5c06ca095503', 'e402da3a-9b92-434e-9998-c2e82ebb1611']","['build-pmars__LXweBjm', 'build-pmars__7UMFbjK', 'build-pmars__uzW99sQ', 'build-pmars__ko4QvRi', 'build-pmars__nhFYJqr']",1,"[818.704025, 901.455583, 926.181533, 478.532829, 2063.595934]","[6.404799, 15.071605, 13.278981, 56.402505, 4.594696]",0.2,False,['d5595a8e-5357-4d81-b28e-773ef9c34798'] +grok-4-0709,build-pov-ray,5,"['ed55c741-b0d2-4367-84f1-9d4083274d72', 'ce97982a-1375-43c8-bf2b-c1426de2a205', '259a0e46-d613-45fc-9924-6c46b5dd62fc', '3bef001b-8719-4e2b-bdab-3d73d3557b26', 
'6840746f-28b9-47b8-b048-240080d9a164']","['build-pov-ray__taQ5EQt', 'build-pov-ray__vcQgEK2', 'build-pov-ray__hmrCiE6', 'build-pov-ray__wn7SYqY', 'build-pov-ray__XjwptTR']",5,"[1766.543346, 1882.814736, 1959.123888, 2279.359497, 1030.578869]","[57.395713, 118.352408, 31.794202, 74.271437, 48.450962]",1.0,True,"['ed55c741-b0d2-4367-84f1-9d4083274d72', 'ce97982a-1375-43c8-bf2b-c1426de2a205', '259a0e46-d613-45fc-9924-6c46b5dd62fc', '3bef001b-8719-4e2b-bdab-3d73d3557b26', '6840746f-28b9-47b8-b048-240080d9a164']" +grok-4-0709,cancel-async-tasks,5,"['d6f11601-42ba-4b67-9836-e28c3012b091', '0e217f67-8ed7-4304-b746-18b4136d6c74', 'd6acfbef-08ce-49ca-ad67-be04b9e885ad', 'b7071872-cfef-42fc-8a08-a1f8d172ce73', '982f1a75-0a33-4cd5-9802-5550c512ff9b']","['cancel-async-tasks__8tmyGKG', 'cancel-async-tasks__XSGhNhc', 'cancel-async-tasks__FJZ7gkM', 'cancel-async-tasks__WRcMdod', 'cancel-async-tasks__vmidpSm']",0,"[151.319581, 104.888625, 221.165722, 194.211972, 266.975641]","[17.594653, 31.97406, 180.854854, 85.957309, 94.360558]",0.0,False,[] +grok-4-0709,chess-best-move,5,"['faf4e312-450e-4fb2-bb93-b971ae700a88', '31b3becc-2ea4-4486-9d57-7441e852c7e0', 'be45e906-45c3-4604-b38f-dd3ff98216a7', '75686b99-aaee-470c-aa2b-218413f22ef6', '49b5b975-45b9-4de9-b40b-918804413fd0']","['chess-best-move__fNmKMyA', 'chess-best-move__wsrBdvz', 'chess-best-move__ungjZAy', 'chess-best-move__eKv9Vjp', 'chess-best-move__oYqURNc']",0,"[900.266951, 911.377773, 903.856588, 917.131429, 902.5297]","[8.296646, 145.737361, 13.950884, 66.936854, 38.539905]",0.0,False,[] +grok-4-0709,circuit-fibsqrt,5,"['d0cc5d13-8e80-4833-a3ee-3dbad4f2b037', '4e5a2fd5-7d67-499f-a773-85e4588ef92e', 'a1c06619-d5b9-456a-907f-3584559f0909', '70aa9ff5-6468-4b8f-b109-ba5ffcc1259b', '3503a565-bbc9-4a0f-a91e-1b71c23dfb4d']","['circuit-fibsqrt__6SoDfCX', 'circuit-fibsqrt__xtugp3v', 'circuit-fibsqrt__ZuAWLhP', 'circuit-fibsqrt__9gzMea9', 'circuit-fibsqrt__tJHCBFA']",0,"[3604.803117, 4113.21673, 3627.213903, 2062.591725, 
3605.816061]","[39.057512, 33.774982, 28.110469, 92.756335, 75.903664]",0.0,False,[] +grok-4-0709,cobol-modernization,5,"['33d4e41d-b94e-4694-b922-4e9ead335775', 'b58843e7-272e-4ef2-938b-f02092be20dd', 'ed1466f2-e283-4eec-8d61-dac66e7afbba', '141d9282-e97b-4bf6-9fb8-75b76bc11444', '7b7d890c-264c-498b-b2ae-0e82d054f32f']","['cobol-modernization__oneNQZq', 'cobol-modernization__HYnHxEE', 'cobol-modernization__GKmMnuk', 'cobol-modernization__MWvU7bc', 'cobol-modernization__5QrRmWd']",1,"[914.904313, 900.037524, 616.530559, 877.583253, 900.722841]","[53.550057, 19.104814, 152.769592, 48.313065, 66.441487]",0.2,False,['141d9282-e97b-4bf6-9fb8-75b76bc11444'] +grok-4-0709,code-from-image,5,"['3cea762d-1761-4a8f-9ca0-cdb45e4c88c2', 'd5e22f1c-526e-425d-b8db-f69bcc7836bf', '536aeaca-c74a-4305-8323-bc75ad04e2d5', '5f4d3c93-9c43-44ed-9570-06627b7467be', '0a708b31-0c40-4b5a-a310-e245caca06b4']","['code-from-image__pcstASJ', 'code-from-image__BLgGsoe', 'code-from-image__XmRZitH', 'code-from-image__c9BjEGk', 'code-from-image__PjqpyXP']",0,"[1866.739917, 1209.333347, 1200.045356, 1200.001493, 1205.949286]","[65.701932, 50.277036, 67.055447, 24.847099, 58.17533]",0.0,False,[] +grok-4-0709,configure-git-webserver,5,"['c7b1a0eb-85fd-487d-b75e-75dfec728222', 'ed7b84dd-bba2-4bea-9a52-6e17019578f4', 'eb7fbc0a-f5bd-46e8-9a16-47ba53568a8a', 'e269aca4-75d8-41b0-bbd3-3226f107bec9', 'd2c4b380-05db-4bb7-a63a-0c01734eb850']","['configure-git-webserver__ffd95AV', 'configure-git-webserver__W8y59Ke', 'configure-git-webserver__7tEmay3', 'configure-git-webserver__6Q7VqaM', 'configure-git-webserver__TFubCTN']",0,"[406.447578, 336.824078, 537.516035, 487.545781, 382.319631]","[65.104852, 24.931034, 68.712787, 39.977063, 58.903135]",0.0,False,[] +grok-4-0709,constraints-scheduling,5,"['0f818b21-1780-46f0-a8f4-82fcbacddb4b', 'f1890747-ce51-4666-9ff1-658eeb017b38', '930aa83e-b2de-4276-beb6-732ac8381ff5', 'd8feae3f-17d0-4624-8fd9-36ef162a809e', 
'ee96708e-0118-4235-8e55-98a88f1b505e']","['constraints-scheduling__zgBQJgK', 'constraints-scheduling__FKwVefA', 'constraints-scheduling__Aaib52J', 'constraints-scheduling__F6m8wKP', 'constraints-scheduling__iNHxh6V']",4,"[1101.814021, 1202.244716, 666.853623, 483.826994, 591.130595]","[25.820875, 114.625374, 146.979925, 71.841108, 72.903817]",0.8,True,"['0f818b21-1780-46f0-a8f4-82fcbacddb4b', '930aa83e-b2de-4276-beb6-732ac8381ff5', 'd8feae3f-17d0-4624-8fd9-36ef162a809e', 'ee96708e-0118-4235-8e55-98a88f1b505e']" +grok-4-0709,count-dataset-tokens,5,"['c2e8bfaa-e950-4939-ad1c-2c8c99e94b42', '9a54e3a4-4fe9-4c19-baf8-624080d4157d', 'c241138e-39d6-47e4-aa0b-9cc1f7ea66db', '74a1c787-b60d-44c2-b35a-41783a7b5cda', '98fa7820-ed8e-40ce-ae49-ce33282431a3']","['count-dataset-tokens__fbY3vmf', 'count-dataset-tokens__Btv7Qr3', 'count-dataset-tokens__dy3LTPx', 'count-dataset-tokens__FZez3Vm', 'count-dataset-tokens__RFLV7UP']",0,"[900.553353, 910.963149, 874.135824, 904.26028, 908.854239]","[18.038943, 36.196649, 56.019979, 54.924629, 22.404125]",0.0,False,[] +grok-4-0709,crack-7z-hash,5,"['1d1a0003-1f74-4815-81f9-6c945bc39b7b', '26171d54-02e8-46cd-9800-600bc07d26ff', 'cc9477e9-aafe-49de-be3f-7ea47163a9c5', '69f0f0fd-0164-4323-8bd5-703646feffe9', 'b3927f65-cccc-4385-a034-1d87da8d901a']","['crack-7z-hash__EKCzAJj', 'crack-7z-hash__zoBVVye', 'crack-7z-hash__cRH7yFo', 'crack-7z-hash__3mixp7j', 'crack-7z-hash__b9J6ryt']",4,"[900.02668, 664.890356, 735.856104, 524.937764, 402.887019]","[50.184469, 10.64557, 30.887908, 38.367556, 19.049414]",0.8,True,"['26171d54-02e8-46cd-9800-600bc07d26ff', 'cc9477e9-aafe-49de-be3f-7ea47163a9c5', '69f0f0fd-0164-4323-8bd5-703646feffe9', 'b3927f65-cccc-4385-a034-1d87da8d901a']" +grok-4-0709,db-wal-recovery,5,"['b4dcd200-3749-427a-aa0a-e020839f3326', '687f2dbe-36ce-4b71-9420-986a58a1c2cf', 'becd73ba-978c-4b84-874f-e2679e017d1a', 'f20d455e-6091-4875-bca0-54a50c72d59c', 'f370eed8-632b-4cc4-831e-4aeaaa26b316']","['db-wal-recovery__KgtLabe', 
'db-wal-recovery__L4xo8sp', 'db-wal-recovery__yfUwJD8', 'db-wal-recovery__fDKFxhp', 'db-wal-recovery__sQYXGEj']",1,"[463.301235, 1019.140304, 914.233676, 909.460891, 904.090081]","[12.864054, 19.823356, 30.282768, 67.633445, 14.120635]",0.2,False,['b4dcd200-3749-427a-aa0a-e020839f3326'] +grok-4-0709,distribution-search,5,"['3da3b6c0-a617-47e0-816d-6715ad7d210d', '81fbbbc2-d765-42f2-8f1b-3c0f6f238e0a', '6271fe85-9d43-47f4-a2ac-f997485d4127', '0cfdc9ce-edfb-46c0-b7d3-67e1f4d08736', 'b02e366d-413e-45ec-bff1-c5270d7568b5']","['distribution-search__JwZyMP4', 'distribution-search__Y9Mf7Hk', 'distribution-search__bTyLt3n', 'distribution-search__y36XBqd', 'distribution-search__Z3dTna7']",2,"[721.909356, 439.210163, 624.848846, 455.419628, 1061.994976]","[205.81127, 34.645128, 14.125246, 124.234986, 146.107097]",0.4,False,"['6271fe85-9d43-47f4-a2ac-f997485d4127', '0cfdc9ce-edfb-46c0-b7d3-67e1f4d08736']" +grok-4-0709,dna-assembly,5,"['4df4f348-712f-4adb-87c3-ee00917faad0', '18ce2677-8cbc-4790-83ac-7c6cdf1d5359', '9fcc9d97-9d54-4400-acd7-c14e2b4fbe10', '9d979ae2-3d24-4dd2-88ed-78ff253fa3cb', '21eb4d38-b16d-403b-a017-0fd6fdd0555d']","['dna-assembly__u58Dizt', 'dna-assembly__36viAtq', 'dna-assembly__mDfReeQ', 'dna-assembly__BvVKkbB', 'dna-assembly__MsVuKvR']",0,"[756.442839, 749.650645, 720.096869, 720.005426, 774.724666]","[214.837107, 20.947184, 125.13312, 39.065493, 65.71613]",0.0,False,[] +grok-4-0709,dna-insert,5,"['6c6eef6f-67ac-400d-a0af-a2241eb9b183', 'a16bf79d-69fc-4f07-9bb9-f5bcad179bd8', 'ca690874-e570-4744-8edf-6cda0825e7c6', 'a35c3618-39e1-4a3e-a414-4e8c4336b4d4', '44294908-ecd5-430f-adae-accf696ae071']","['dna-insert__VomtXSQ', 'dna-insert__5tckwNb', 'dna-insert__yrn2Tvq', 'dna-insert__H7zPrca', 'dna-insert__LcyGS7E']",0,"[387.284604, 361.224911, 383.523004, 434.963809, 366.976216]","[42.068176, 18.602269, 39.031476, 37.924054, 51.341099]",0.0,False,[] +grok-4-0709,extract-elf,5,"['568e0102-19d3-4ef4-8bb9-cfaee50d42b1', '2afa9d84-5233-462a-b757-858c82a1db65', 
'110deeae-2808-416a-8065-00b657deab8f', 'b7a1be39-8872-4fed-b9c7-bcdddc372a93', 'b567729b-1838-46c1-8325-930ad2d31507']","['extract-elf__ax5qMUp', 'extract-elf__RPc7vKp', 'extract-elf__B26ssgf', 'extract-elf__Qp2P92T', 'extract-elf__hAdWW4A']",1,"[904.723108, 384.71568, 529.264059, 455.43338, 893.761135]","[23.957425, 45.447561, 43.2613, 175.920659, 58.388765]",0.2,False,['2afa9d84-5233-462a-b757-858c82a1db65'] +grok-4-0709,feal-differential-cryptanalysis,5,"['7f6e296e-e065-41d3-bf73-e5dc2eaca4a8', '6c0e03f8-62d1-41b9-974f-01cf02b5784e', 'c3ab2e21-8e5b-44e2-8cec-711608eb807a', '1a9ba0d6-aab8-40ce-bc4d-d9e277f114d2', '97ab00be-9882-466f-aa3b-b6dd87c118b4']","['feal-differential-cryptanalysis__5SmFMKz', 'feal-differential-cryptanalysis__PsM53BV', 'feal-differential-cryptanalysis__KLCPKUV', 'feal-differential-cryptanalysis__8DDkDSM', 'feal-differential-cryptanalysis__UcXuQbT']",4,"[731.298854, 811.234777, 768.951183, 826.135716, 1834.810201]","[216.174658, 24.200534, 65.189811, 21.996972, 46.573138]",0.8,True,"['7f6e296e-e065-41d3-bf73-e5dc2eaca4a8', '6c0e03f8-62d1-41b9-974f-01cf02b5784e', 'c3ab2e21-8e5b-44e2-8cec-711608eb807a', '1a9ba0d6-aab8-40ce-bc4d-d9e277f114d2']" +grok-4-0709,feal-linear-cryptanalysis,5,"['7fd45ec5-7685-4c14-99d4-81750630eecf', 'ce9404d9-5f38-4b79-9763-acec983732d4', 'ed22019e-8b53-423e-87c8-4dd2ce68fba2', 'c45a7639-2529-4821-874e-f8736b1d4bd5', 'ebf4450e-6699-45ff-a837-a4ecb300cf9b']","['feal-linear-cryptanalysis__fAZQ8h7', 'feal-linear-cryptanalysis__drAzjka', 'feal-linear-cryptanalysis__4iFm4Ep', 'feal-linear-cryptanalysis__hUd5TT3', 'feal-linear-cryptanalysis__hojUndp']",0,"[1803.391062, 1810.901472, 2322.54027, 1801.016086, 1814.053289]","[95.018461, 71.52591, 42.437032, 21.210591, 13.954343]",0.0,False,[] +grok-4-0709,filter-js-from-html,5,"['1c15cc11-ba44-4d52-ad7e-a73a84f059e4', '221a7e3b-c57c-44b1-b91d-04ee856cd993', 'f9f8216f-5f56-4763-a81a-c484b33fe3dd', 'a588cf8c-0309-462a-9867-e86db0eda599', 
'85aa4dc2-4b65-4ed9-9b1b-060c97b3d881']","['filter-js-from-html__2j2QGUq', 'filter-js-from-html__86TDfUP', 'filter-js-from-html__Dh9W5ay', 'filter-js-from-html__WNTkXEX', 'filter-js-from-html__iXkgdEk']",0,"[319.098513, 527.277799, 737.144572, 409.077527, 266.375329]","[125.49057, 50.790237, 92.084856, 64.631727, 33.216059]",0.0,False,[] +grok-4-0709,financial-document-processor,5,"['d6b4176b-6a74-4ad7-9760-c05bb64a5445', '4c5a08ad-beed-4be3-ba32-f30d3f4a178e', 'f9640edb-8613-4300-8701-477c0512c7b0', '04d108d2-5331-41d3-8e72-9ae4921c3632', 'df091b11-f901-4785-9e12-343f5885e082']","['financial-document-processor__CAaEAUd', 'financial-document-processor__R87UVUj', 'financial-document-processor__aqRdTaq', 'financial-document-processor__tKnF3vk', 'financial-document-processor__pWEq4XC']",0,"[1225.359464, 566.509606, 501.25845, 801.320454, 496.659992]","[292.625339, 29.594311, 20.272569, 118.234884, 139.258447]",0.0,False,[] +grok-4-0709,fix-code-vulnerability,5,"['f8d2d477-e5eb-49df-a9e8-69ffa83b56da', '8ee45d2f-2056-4400-b3ac-af56b68be3ec', '8c31613f-334d-4ba5-8540-e574dfbd92d9', 'ddfd4110-01a6-41a0-83d1-26bea4615157', '07ebf929-fb6b-4afd-a2f2-833e7dcedc67']","['fix-code-vulnerability__P3TQLD9', 'fix-code-vulnerability__NVxsZzE', 'fix-code-vulnerability__DBpctsu', 'fix-code-vulnerability__sY2gPnB', 'fix-code-vulnerability__vVReddX']",1,"[900.000633, 900.848946, 994.054723, 947.287169, 912.346991]","[9.384136, 76.158752, 39.570593, 5.316983, 74.318405]",0.2,False,['8ee45d2f-2056-4400-b3ac-af56b68be3ec'] +grok-4-0709,fix-git,5,"['d04c0a1b-f507-48a2-b04a-449174b0d17b', '8051cf7f-2de6-4865-9cf9-dc1973d1ee78', 'bfaa828b-aea2-4736-887b-bc7a3b9e3710', 'a742096c-f8d9-4d04-9d79-c00645ff09a8', '0a0351d6-8b38-4172-a848-ae94a42cf371']","['fix-git__QhpzhQH', 'fix-git__v6KhnjY', 'fix-git__hnRchHe', 'fix-git__jXbPyPt', 'fix-git__hFU3eP9']",5,"[355.122256, 167.355702, 572.73406, 245.989973, 154.096906]","[73.795986, 26.735726, 32.631393, 38.783413, 
45.337869]",1.0,True,"['d04c0a1b-f507-48a2-b04a-449174b0d17b', '8051cf7f-2de6-4865-9cf9-dc1973d1ee78', 'bfaa828b-aea2-4736-887b-bc7a3b9e3710', 'a742096c-f8d9-4d04-9d79-c00645ff09a8', '0a0351d6-8b38-4172-a848-ae94a42cf371']" +grok-4-0709,fix-ocaml-gc,5,"['6dd8dd37-af93-4da9-a56e-f981c0f6851e', 'eabd3d58-5bb4-4d58-b80f-845cdd96e3f0', 'a8977b2d-872f-4cd9-9242-3e58c6e5e4f0', '83591efe-5a9e-4f61-811c-521af2c39eac', '1695b04b-4ecd-4a43-92e9-c7fd5b10402e']","['fix-ocaml-gc__gnVMfyw', 'fix-ocaml-gc__PV6mgJT', 'fix-ocaml-gc__i8yo4oD', 'fix-ocaml-gc__WRX2XYS', 'fix-ocaml-gc__RQwHs3M']",0,"[3602.41715, 3600.003152, 2283.769183, 3697.597806, 2947.333315]","[46.494506, 33.643887, 55.110679, 68.928685, 118.880309]",0.0,False,[] +grok-4-0709,form-filling,5,"['17675549-e130-45c0-a7ed-c3cfcc2add4f', '22eb9328-282e-4bf9-84c1-a46f90d9299e', 'da706fb1-2911-44ce-9a5d-38d12e5dc16d', 'a4a62168-cb3a-4df7-8fe7-8f13eb40ca3b', 'e56b2f2e-27e6-4ffb-b1f5-30fe3491bd10']","['form-filling__tMuP6ZR', 'form-filling__ZJLSZYo', 'form-filling__hxFgNgj', 'form-filling__nG2Sexd', 'form-filling__U5KuUMo']",1,"[372.071094, 502.933091, 248.24216, 310.68523, 470.98634]","[9.513546, 4.887268, 22.481224, 42.379212, 4.590014]",0.2,False,['22eb9328-282e-4bf9-84c1-a46f90d9299e'] +grok-4-0709,git-leak-recovery,5,"['d4162ea2-8493-4e15-a5f6-bc1dd14ec251', '6dde1c14-c37f-4421-810b-912e270dc377', '9258c28c-fc1f-409e-99b6-83c31c426301', 'b2d61631-fc6e-4445-a924-ccaee1f73275', 'e1c5f95a-d825-4f41-9020-5feb24e4361a']","['git-leak-recovery__yCjB7Sa', 'git-leak-recovery__f5SFs9q', 'git-leak-recovery__4uBfMst', 'git-leak-recovery__iS5Mybz', 'git-leak-recovery__C5GYqFK']",2,"[290.075708, 503.906558, 235.720213, 902.611469, 202.910628]","[59.043812, 16.504101, 83.1286, 19.566895, 41.465167]",0.4,False,"['9258c28c-fc1f-409e-99b6-83c31c426301', 'e1c5f95a-d825-4f41-9020-5feb24e4361a']" +grok-4-0709,gpt2-codegolf,5,"['2645a1f5-2ae3-4937-a1eb-f51f8e44f383', '068b22e5-4ec3-4ff9-bd5b-fc2229c75dc6', 
'45a7bbf1-8574-4af4-b6fd-87a10037f3ec', '2444cc8f-d451-4a1b-899a-2d3fb4229814', 'eedd1016-cf0a-4448-a5fe-876954b7edf1']","['gpt2-codegolf__KnrcVSr', 'gpt2-codegolf__6FSHXsS', 'gpt2-codegolf__4zB7USr', 'gpt2-codegolf__dsi5JLN', 'gpt2-codegolf__qawpebS']",0,"[165.626822, 200.419406, 342.080994, 115.686724, 192.891878]","[84.68002, 70.998073, 192.181054, 25.4771, 369.926849]",0.0,False,[] +grok-4-0709,hf-model-inference,5,"['66874905-467a-4e9d-b645-bc7fdb1f7bde', '2b0e296c-80b8-44e6-8b45-c8deb9d78897', '3182f1f2-49c3-417b-946c-117e2712bf7d', 'a85b0731-f46b-401f-b2ec-75a5b5bed178', '7ea72d4f-78c9-4030-a7fb-47eadf1a88f5']","['hf-model-inference__qU2AEfq', 'hf-model-inference__rx4vMeG', 'hf-model-inference__r6PwJmZ', 'hf-model-inference__kdP7567', 'hf-model-inference__8kHhkbQ']",5,"[291.083538, 438.960544, 552.151505, 460.246729, 422.673379]","[15.47582, 30.255316, 33.380878, 108.450675, 65.52859]",1.0,True,"['66874905-467a-4e9d-b645-bc7fdb1f7bde', '2b0e296c-80b8-44e6-8b45-c8deb9d78897', '3182f1f2-49c3-417b-946c-117e2712bf7d', 'a85b0731-f46b-401f-b2ec-75a5b5bed178', '7ea72d4f-78c9-4030-a7fb-47eadf1a88f5']" +grok-4-0709,install-klee-minimal,5,"['00a18e70-ca97-4d39-9498-a6abc8b5772d', '470630eb-8d41-48ef-ab42-92678266fc54', 'c5e70346-269f-42d7-b983-310c86ca648e', 'b176b07f-ca2d-408e-aa9b-3414a26fc467', '4ce324e8-aa9f-4215-a07c-8dc7bd4e0b75']","['install-klee-minimal__CUFLu3D', 'install-klee-minimal__U6M4qtN', 'install-klee-minimal__QLBoFvm', 'install-klee-minimal__vo8oRE9', 'install-klee-minimal__BuHHkyY']",0,"[900.017379, 902.858161, 900.094078, 908.183209, 900.096919]","[64.200008, 65.912101, 106.486168, 36.624284, 37.737509]",0.0,False,[] +grok-4-0709,install-windows-3.11,5,"['68db99b7-51c6-4ea6-a594-d3044733dc58', '0593056a-8060-43e3-a9ef-66e912f11d26', 'd2bbee39-1247-4ccc-9029-fb321b3ea40b', 'd8751f5b-3420-49c9-834e-8aeffa48bb6d', '312e49dc-7896-4864-a075-c1ddb7717349']","['install-windows-3.11__j5TD4dp', 'install-windows-3.11__dtSdHnD', 
'install-windows-3.11__Z6kD3tF', 'install-windows-3.11__jUotwTb', 'install-windows-3.11__Sd9zmW6']",0,"[512.911126, 1168.214581, 1085.602217, 316.196732, 342.682359]","[63.316284, 40.396391, 39.925673, 30.51819, 12.802232]",0.0,False,[] +grok-4-0709,large-scale-text-editing,5,"['4d43befe-7cf9-406a-9aec-36fbdea7bc47', '255d41b0-9bda-4df7-8fed-0231f3d3cbdd', 'c93402dc-192f-498c-8db8-247f1b3249cf', '72545f41-4ed1-423b-86b1-e54954e7c83a', '92f03e5e-f64d-4837-ba30-bdeff5bcc39f']","['large-scale-text-editing__QX5DZWf', 'large-scale-text-editing__YiPeBym', 'large-scale-text-editing__eSnZgZr', 'large-scale-text-editing__Sb8ncEh', 'large-scale-text-editing__zWnECvt']",2,"[384.673622, 579.085318, 1200.487176, 341.078518, 631.20016]","[333.266163, 262.151259, 164.644045, 21.282727, 96.126821]",0.4,False,"['72545f41-4ed1-423b-86b1-e54954e7c83a', '92f03e5e-f64d-4837-ba30-bdeff5bcc39f']" +grok-4-0709,largest-eigenval,5,"['f56cf574-254b-454d-86db-ac4381a25790', '3fab5d00-5e53-4e88-99fd-c5e220b7c866', '06f54a6d-e2e8-4543-aefa-23f6f8aa2259', 'db138fc4-725e-4613-b599-6823738a4c07', 'b1fbb71f-78b9-4d03-9cc2-b15ecd62fba8']","['largest-eigenval__wSYMTwg', 'largest-eigenval__k94Z3Hv', 'largest-eigenval__jKBKZu6', 'largest-eigenval__iANyPDn', 'largest-eigenval__kP8uMUE']",0,"[901.437261, 913.75097, 900.051819, 902.725174, 962.51849]","[36.325171, 69.314496, 41.387829, 49.543292, 322.531519]",0.0,False,[] +grok-4-0709,log-summary-date-ranges,5,"['9200626e-5e9f-4f21-b9cb-ea295228b32d', '39a66b04-2c14-4dbe-8f26-410f4e360fba', '2ead6217-9dce-439d-8ba7-f6af67734429', '3310e3ad-6f71-45af-88bc-1c4dc494de54', '788f1075-8cd5-4b60-ae3d-e0ac40e8934c']","['log-summary-date-ranges__YyCRLuq', 'log-summary-date-ranges__KFdY3Wc', 'log-summary-date-ranges__oQoqNyj', 'log-summary-date-ranges__wSffpmT', 'log-summary-date-ranges__oZRAVuX']",0,"[328.253905, 914.86037, 561.700113, 457.625986, 909.086372]","[70.73825, 121.900783, 78.478186, 163.840262, 19.514994]",0.0,False,[] 
+grok-4-0709,make-doom-for-mips,5,"['c46ca70b-7d11-484c-b1f4-880a6ae0029b', '45b665b8-f440-4cf7-89e2-00df40c64b76', 'b52b7e65-ce21-41cb-a3e6-5f956ab3c49f', '4e3b12d9-097a-41cc-9cb9-76841944c92c', '7408f7b8-4c3b-43e1-afa4-58538450a4b4']","['make-doom-for-mips__YfZvNA7', 'make-doom-for-mips__hGGPRSG', 'make-doom-for-mips__HSTygsw', 'make-doom-for-mips__6R89wfW', 'make-doom-for-mips__XcpuXwy']",0,"[762.002849, 915.446561, 909.325168, 610.240123, 908.349769]","[22.524949, 78.991176, 47.817966, 206.901226, 48.503273]",0.0,False,[] +grok-4-0709,make-mips-interpreter,5,"['88a9cd3e-5be0-4bcb-8324-dd7580bf5a62', 'b1ad8645-9ee0-45e0-aef7-a491a07d3393', 'b6be878c-b1ce-4536-9327-b321767ea855', 'ad31bfcb-f729-46f9-993d-82cad9da3d46', '6b4fb7be-8759-4512-b17d-f08c0998233e']","['make-mips-interpreter__U4U969B', 'make-mips-interpreter__Aiys2mU', 'make-mips-interpreter__CwS23pL', 'make-mips-interpreter__g3dPS9P', 'make-mips-interpreter__a4cotJR']",0,"[1803.162384, 1809.511643, 2057.934995, 1801.307985, 1802.716715]","[121.172384, 112.449852, 21.767716, 31.084974, 98.564426]",0.0,False,[] +grok-4-0709,merge-diff-arc-agi-task,5,"['69c75112-05e5-45e8-8986-73703ce702b6', 'acea63b2-219b-4724-a789-b6833632c03c', '1987feb4-4849-4179-abb2-cc106198eaf0', '4455e51e-5067-490f-aa31-7f835f910562', 'efeacfb3-e638-4c44-8d65-015f25a4ea31']","['merge-diff-arc-agi-task__x24g4CV', 'merge-diff-arc-agi-task__3YoA8hA', 'merge-diff-arc-agi-task__GboF8fD', 'merge-diff-arc-agi-task__7WcgYcQ', 'merge-diff-arc-agi-task__aEi8c3o']",2,"[902.316225, 581.150503, 914.198965, 907.250697, 888.551456]","[22.397383, 34.641001, 67.195418, 169.388256, 59.532061]",0.4,False,"['acea63b2-219b-4724-a789-b6833632c03c', 'efeacfb3-e638-4c44-8d65-015f25a4ea31']" +grok-4-0709,model-extraction-relu-logits,5,"['c7e7cf38-c6d3-4748-89cd-e6ad56e3c377', '675d9cff-07e9-4229-8683-ac5672b88e93', '70c077a3-acb3-4766-b887-a3ee5e3a0fa7', '06458568-ee0f-499e-b3af-380fd4396614', 
'5e91e6d4-f503-43f3-8689-d04f56832f19']","['model-extraction-relu-logits__THUEudU', 'model-extraction-relu-logits__KYWUxqA', 'model-extraction-relu-logits__Bd5wnos', 'model-extraction-relu-logits__9Miodzu', 'model-extraction-relu-logits__tEFLUi4']",0,"[925.749087, 900.479796, 1164.229483, 848.49283, 900.119196]","[15.170008, 58.099096, 37.87, 104.350225, 24.515645]",0.0,False,[] +grok-4-0709,mteb-leaderboard,5,"['a6589e35-a4b3-4b7c-a093-d3757a8b52f2', 'eca6dbc7-7f19-4ecc-9c63-c9d8cf7cf3fa', '3c5b00a7-5aa4-4d35-85ba-0bdaf4de0e53', 'adc1a977-1904-489f-bc6c-17e19fc5abe5', '7bda9cf0-03c1-4c6d-93dd-d0407cc75b0d']","['mteb-leaderboard__MAcoSe3', 'mteb-leaderboard__BoWMPRJ', 'mteb-leaderboard__cjDjZEK', 'mteb-leaderboard__p3Kisuh', 'mteb-leaderboard__XAd5Rzc']",0,"[330.339313, 189.639165, 187.180532, 155.60713, 247.911355]","[8.442264, 8.246268, 32.674822, 16.123655, 63.776601]",0.0,False,[] +grok-4-0709,mteb-retrieve,5,"['0f5b59f4-62d2-4ca9-880d-d689c3ba5736', '6cdfca9a-d1d2-4121-9068-b54e593e747e', '94cc043f-9ecf-4557-bbb8-70d1fc7fd678', '5f319ce4-f7c9-46c9-be10-dc4663a3af32', 'f20a9116-c776-419b-abad-2d1964329e2f']","['mteb-retrieve__dkuXduH', 'mteb-retrieve__UEbHeyc', 'mteb-retrieve__hB5G7JP', 'mteb-retrieve__5ugpVM6', 'mteb-retrieve__a2WpsYq']",0,"[508.654613, 534.025029, 295.140364, 209.238869, 283.055218]","[5.918316, 23.064595, 13.019908, 13.76269, 93.722656]",0.0,False,[] +grok-4-0709,nginx-request-logging,5,"['d7656e62-144b-43f0-8f15-e61ca9299d66', 'b1e3d7a6-61f6-4b8d-bd3a-fa8314e7955a', '7ded1b3b-dd51-472e-9233-1a5f6557ad7c', 'a717d196-ee77-4c28-a6ae-b8c6f3463115', '1ee83146-5264-419a-8ef7-4596ef601e8e']","['nginx-request-logging__2sPL9eh', 'nginx-request-logging__EVhURJU', 'nginx-request-logging__mpperGD', 'nginx-request-logging__Lc5QUzT', 'nginx-request-logging__hfLvXKd']",5,"[900.498498, 396.256201, 353.170968, 277.766512, 559.380688]","[161.782828, 14.523332, 49.208807, 58.734665, 36.225168]",1.0,True,"['d7656e62-144b-43f0-8f15-e61ca9299d66', 
'b1e3d7a6-61f6-4b8d-bd3a-fa8314e7955a', '7ded1b3b-dd51-472e-9233-1a5f6557ad7c', 'a717d196-ee77-4c28-a6ae-b8c6f3463115', '1ee83146-5264-419a-8ef7-4596ef601e8e']" +grok-4-0709,openssl-selfsigned-cert,5,"['95fdc1a7-ef46-44fe-93b4-d1b20c433e3f', '0edb2b34-cecf-4acb-af41-074d52ea8bc8', '801a87e7-f9c7-40ff-affc-9c5b7b800f46', '243dff01-b3ef-4e14-8257-b3be2f483061', '23a4a582-67c6-4159-883e-a943c3f75781']","['openssl-selfsigned-cert__BFhZ78P', 'openssl-selfsigned-cert__bF5eNfz', 'openssl-selfsigned-cert__zA9wSGb', 'openssl-selfsigned-cert__vwnpoze', 'openssl-selfsigned-cert__V727kSE']",0,"[163.036398, 116.44857, 242.801096, 183.724676, 200.871489]","[32.195952, 50.407021, 54.532331, 45.129356, 68.977359]",0.0,False,[] +grok-4-0709,password-recovery,5,"['b8a17eea-4b3f-43e5-8c6c-15f0677e92c9', '2317eb39-2e5d-4794-8b57-c4a87b9f7051', '4fae0c4c-f3c1-48a0-8d6d-31e283f316ed', '0637f413-3133-44ff-aee1-76d8758bd7d8', '0024b61a-5730-447a-b355-529ac5632ea4']","['password-recovery__KEYqm8M', 'password-recovery__GbpD4p7', 'password-recovery__jany3s9', 'password-recovery__ednBhwC', 'password-recovery__VG8ku8k']",0,"[903.627722, 907.419619, 1549.61206, 904.304843, 900.413332]","[16.52749, 71.122712, 159.418437, 38.709117, 17.161631]",0.0,False,[] +grok-4-0709,path-tracing,5,"['2eaca569-3442-4e32-a371-93c7e9f40804', 'b3806b10-c331-4cfc-b6af-c6deda827499', '76ab802c-6b26-4ea4-b150-61ae2d8e1a36', 'e18682a6-1072-4f7f-9fda-a91471928efb', 'f53e27a8-4827-418c-9499-f5fbf86990b8']","['path-tracing__PkrMwuF', 'path-tracing__eiyHLns', 'path-tracing__QvSEbSs', 'path-tracing__x3DajA6', 'path-tracing__mvwzD57']",0,"[1802.646409, 1800.046095, 1860.298814, 1800.08514, 2025.897205]","[206.853162, 31.274793, 36.207341, 91.718863, 268.944356]",0.0,False,[] +grok-4-0709,path-tracing-reverse,5,"['0265fe6c-a1dc-4955-8713-c6a8b726103e', '70f41658-a133-40d4-bfdc-b98565172e7a', '7b1d24c4-36ab-4ab0-ad25-19af08413b90', 'cab7fb13-e843-4940-b200-1a2265760aac', 
'f8b7fbb3-a2fc-4501-b10d-38fb307a3fc5']","['path-tracing-reverse__dWdnbXM', 'path-tracing-reverse__LjDoPT3', 'path-tracing-reverse__Ph5SZyZ', 'path-tracing-reverse__NkMjRQd', 'path-tracing-reverse__uJN3rHc']",0,"[1856.440668, 1802.345362, 1816.671305, 1807.948347, 1832.513526]","[72.558709, 31.038622, 139.992015, 123.333602, 59.967138]",0.0,False,[] +grok-4-0709,polyglot-c-py,5,"['e11f644c-e4e6-41ae-a36f-a95f138e6e40', '81e43f3a-062a-4da3-9460-0848453b8b02', 'b4e61eba-c320-4f78-a1f2-263dfe3d793d', '741cef4b-4f50-4cc5-8c41-9c2ea1e0ba65', '457db808-3feb-4f3b-b00b-07d11365529f']","['polyglot-c-py__Sg8k3eG', 'polyglot-c-py__m2iqa5N', 'polyglot-c-py__rERfuPq', 'polyglot-c-py__XEHri7S', 'polyglot-c-py__ZJw7UXV']",3,"[902.57269, 488.151746, 166.432063, 280.463774, 606.481813]","[40.030165, 50.334199, 19.685069, 43.319571, 61.781564]",0.6,True,"['81e43f3a-062a-4da3-9460-0848453b8b02', '741cef4b-4f50-4cc5-8c41-9c2ea1e0ba65', '457db808-3feb-4f3b-b00b-07d11365529f']" +grok-4-0709,polyglot-rust-c,5,"['a7ca0d02-2ecb-45c1-b9d9-088ebeed125d', '5b60c6ed-f72d-44e0-9f34-6841be37abb2', '5804a8e2-432a-45e9-8c15-2a038a5549bd', 'fec93a22-3d7f-4957-af2d-7ff66628cd40', '44278ba4-f261-43c2-8ab6-715e3102d544']","['polyglot-rust-c__BxynGQz', 'polyglot-rust-c__sdMZUAf', 'polyglot-rust-c__jp6Qgx2', 'polyglot-rust-c__rKjcJxF', 'polyglot-rust-c__gZNJ2p8']",0,"[900.176969, 926.205025, 900.109638, 746.174398, 906.139468]","[12.326077, 61.412449, 111.435751, 106.22706, 179.87701]",0.0,False,[] +grok-4-0709,port-compressor,5,"['27d6791b-6b93-481f-a9e5-3da67c2c0004', '677bd8bc-ab5e-4a94-b354-58709e0c0e5e', '5d24890c-e8c7-4b64-bf3e-5d645f7280ec', '703cef0a-8a76-489b-8c63-9a9e8c553222', '0497da47-e286-4ad6-b580-4c2aaf40463c']","['port-compressor__suMimpc', 'port-compressor__aKjxS8k', 'port-compressor__srLhkR3', 'port-compressor__jqKZknu', 'port-compressor__RJFFYYf']",0,"[3602.36234, 3600.002399, 3605.33934, 3623.846709, 3610.970821]","[114.979538, 24.181994, 75.662811, 67.601791, 
151.642992]",0.0,False,[] +grok-4-0709,prove-plus-comm,5,"['833951b4-feb0-4d46-84e3-d9e215ee1736', 'ab3d2779-b0d2-4960-8c7f-5c1c30ee59f4', '21342448-ee8a-43a7-b5e1-ed20b3eb879a', '1bf5a051-bb8f-43fd-a21d-0a9144ada50a', 'e4ba06d7-4687-4dcb-b03f-e6b8ee40946c']","['prove-plus-comm__5XGznsr', 'prove-plus-comm__vUQLmXL', 'prove-plus-comm__K9ZN5ga', 'prove-plus-comm__PiypLZN', 'prove-plus-comm__Du6VbkQ']",4,"[329.157309, 638.25612, 464.475587, 904.255835, 339.93954]","[42.905596, 65.711057, 141.650614, 92.122501, 13.197934]",0.8,True,"['833951b4-feb0-4d46-84e3-d9e215ee1736', 'ab3d2779-b0d2-4960-8c7f-5c1c30ee59f4', '21342448-ee8a-43a7-b5e1-ed20b3eb879a', 'e4ba06d7-4687-4dcb-b03f-e6b8ee40946c']" +grok-4-0709,pypi-server,5,"['daebf798-83c0-43d4-8c1c-991bd40fe682', '599ac243-d17f-4296-93a6-dd29dd392cf5', 'b0ed129d-4062-4e12-b953-32c327456a9d', '36561de2-0b6f-4cf4-b168-8d295dc546c0', '3c42443c-6c5c-4293-a265-8e3096636f2c']","['pypi-server__whGc8s2', 'pypi-server__HFHJVLb', 'pypi-server__VvyBmDL', 'pypi-server__9Y9oMNM', 'pypi-server__NMQV9fn']",2,"[364.268693, 907.239492, 271.967675, 249.580629, 491.081837]","[172.014937, 36.647686, 68.789692, 101.37842, 36.351382]",0.4,False,"['599ac243-d17f-4296-93a6-dd29dd392cf5', '3c42443c-6c5c-4293-a265-8e3096636f2c']" +grok-4-0709,pytorch-model-cli,5,"['b01012d5-9bbb-4f15-a205-39120ca6a1d7', '18c5e280-cd7b-42a3-8625-6a1fbd4d6efa', '58af97cc-c69e-4149-ac6b-7bc71db7a0e1', 'f0025690-0fbf-431e-b9c2-82f174c012dd', 'd2d30452-33d6-4e06-92cb-c7e671f1c114']","['pytorch-model-cli__j6PWGpR', 'pytorch-model-cli__evaXuDT', 'pytorch-model-cli__dhGeuuW', 'pytorch-model-cli__bKkrPiW', 'pytorch-model-cli__3cAMMcA']",3,"[795.579642, 603.207313, 900.494879, 900.033448, 767.715527]","[70.600339, 79.360548, 98.990695, 87.219098, 68.174861]",0.6,True,"['b01012d5-9bbb-4f15-a205-39120ca6a1d7', '18c5e280-cd7b-42a3-8625-6a1fbd4d6efa', 'd2d30452-33d6-4e06-92cb-c7e671f1c114']" +grok-4-0709,pytorch-model-recovery,5,"['049de1a0-a73b-4a1f-8dd4-fc6e15cd3155', 
'b76be109-c175-4aa4-9fcc-ad35c48685ca', '5001f33a-d49b-4725-b868-40a3a9f0088a', '1410e098-b1a6-4180-85c0-df5f0aeb58ab', '1a723b17-4731-4f68-bd20-c1789dabf8ea']","['pytorch-model-recovery__UcgrR5g', 'pytorch-model-recovery__qHxddoN', 'pytorch-model-recovery__VWoZtqv', 'pytorch-model-recovery__wZKkpAx', 'pytorch-model-recovery__HNFpohk']",1,"[909.795331, 900.0293, 903.527938, 912.813393, 903.574306]","[109.968589, 58.010634, 59.770187, 13.371827, 53.699598]",0.2,False,['1410e098-b1a6-4180-85c0-df5f0aeb58ab'] +grok-4-0709,qemu-alpine-ssh,5,"['90c3eb82-fe6b-4932-be3d-0839a4e097c3', '5945d0c2-36de-4049-9a35-b2b880dbc9d1', '1de69a71-f848-469d-8298-eb18cde45f23', '2b6c5890-4caf-443f-aad0-3cf6b29704b5', 'a1cac633-be56-4e41-9681-7cdcbe606461']","['qemu-alpine-ssh__fRHZXFn', 'qemu-alpine-ssh__dnH8ezG', 'qemu-alpine-ssh__zh5E84q', 'qemu-alpine-ssh__hf7eWCN', 'qemu-alpine-ssh__pPV6L9f']",0,"[251.76765, 557.619939, 960.69337, 361.872523, 374.229161]","[64.226152, 33.799688, 5.254821, 17.760785, 9.912209]",0.0,False,[] +grok-4-0709,qemu-startup,5,"['1a92c906-f747-415f-babd-2d320d28e92f', '1d5bee34-f592-45be-aadb-8c81bc0d8f11', '3110eea4-e036-4e60-be14-5a47c5b6d9ab', 'a44da1ed-b12e-4153-b5e1-fdd171eab7ac', '3742f7fd-53b0-4929-8c19-9f94b828f836']","['qemu-startup__WHzHWXd', 'qemu-startup__PG5rkPX', 'qemu-startup__hBFAWE4', 'qemu-startup__mDYFnqC', 'qemu-startup__TK4EK89']",2,"[478.122418, 902.780115, 904.662798, 1018.743296, 916.980591]","[43.706974, 3.222935, 120.408926, 108.419783, 11.791007]",0.4,False,"['1a92c906-f747-415f-babd-2d320d28e92f', 'a44da1ed-b12e-4153-b5e1-fdd171eab7ac']" +grok-4-0709,regex-log,5,"['d1a11941-1001-450e-a4d7-8255463153e1', '1321e30a-e0d9-49de-820e-1d7e4daed94a', '9eb34595-3c66-4ac0-ae58-bc728fa1c68f', 'dbafe363-3c24-4999-93cb-a804603d4e3b', '6b36c97b-3559-4a3e-970e-5956fc28f34c']","['regex-log__QW4LYhD', 'regex-log__qEvyRUR', 'regex-log__imGpKxe', 'regex-log__6JgARjt', 'regex-log__MUXRNpj']",3,"[326.288649, 302.33619, 235.37137, 583.490481, 
267.028883]","[179.927601, 260.751217, 157.700824, 24.965019, 47.10468]",0.6,True,"['d1a11941-1001-450e-a4d7-8255463153e1', 'dbafe363-3c24-4999-93cb-a804603d4e3b', '6b36c97b-3559-4a3e-970e-5956fc28f34c']" +grok-4-0709,reshard-c4-data,5,"['cf09e239-52ba-4487-bd57-7bda44ceab33', '8577cfaa-3a2a-46cd-a6de-54c6eae6dfc7', '77befbd9-2073-4e41-9c2c-f79641ad5a09', '7f0add51-8baf-4af7-b687-d4a6ae1de47f', '34deb58a-e735-4c87-b523-c955da1913ae']","['reshard-c4-data__4A8CJtU', 'reshard-c4-data__8odNf5j', 'reshard-c4-data__QiAhmS9', 'reshard-c4-data__56corGS', 'reshard-c4-data__nufSorN']",0,"[906.846254, 901.523752, 901.086579, 909.682071, 1685.104608]","[67.799498, 23.181315, 50.62469, 55.408604, 46.526885]",0.0,False,[] +grok-4-0709,reverse-engineering,5,"['cc7195b5-5151-42d3-ae73-74e475f5a503', 'f8dfcd45-b710-4072-b509-82c145e95350', 'a6d26931-9a2b-4a2c-ae40-d0c8af583cb9', '58c7f7cc-eafd-422d-9c35-a18728eb653d', '5292ba24-b51f-4f30-8994-7e01ce27d17d']","['reverse-engineering__ewmZQET', 'reverse-engineering__kgrJS6w', 'reverse-engineering__xo5nGKF', 'reverse-engineering__VMSb86f', 'reverse-engineering__v82NYbD']",1,"[1802.557031, 2616.468792, 1800.064454, 1800.96446, 777.174587]","[46.743662, 27.034955, 74.181022, 9.9225, 50.469579]",0.2,False,['5292ba24-b51f-4f30-8994-7e01ce27d17d'] +grok-4-0709,run-pdp11-code,5,"['5a1ada2c-70ec-4daf-9f8d-de86b690f113', '58cc3941-88a0-455e-9ffe-4a0e05525d85', 'fc4cfd33-df42-4460-916c-27d847a43da8', '96ce99b7-bb4e-4d7b-9751-80b65d681237', '1cbdd164-b331-4539-8f4d-76ea079c3d6c']","['run-pdp11-code__ZT2iMh7', 'run-pdp11-code__t9vfKkA', 'run-pdp11-code__PzUT4eu', 'run-pdp11-code__FE5R57o', 'run-pdp11-code__mRSPdkv']",0,"[1007.772376, 1002.790046, 1023.539085, 1002.96926, 2470.05237]","[71.995189, 26.655058, 72.892545, 42.844949, 320.739305]",0.0,False,[] +grok-4-0709,sanitize-git-repo,5,"['6b61bf73-d2ea-416e-9a77-37fcac2543da', '9d5649f7-075e-4a87-b075-5d7ced8de2b0', '1aebe770-0355-487b-9581-e63b532da6c9', 'fa7ff783-1934-4c01-9b1c-89f429100981', 
'b18ebde1-486f-498f-b12b-5bf7caf922c9']","['sanitize-git-repo__JtjARbn', 'sanitize-git-repo__gMgU3Ms', 'sanitize-git-repo__GCJA5yB', 'sanitize-git-repo__HosMXvx', 'sanitize-git-repo__siDf2zj']",0,"[516.96535, 340.71191, 705.613592, 458.522079, 1012.415013]","[34.955331, 30.678908, 33.532302, 21.579042, 313.539499]",0.0,False,[] +grok-4-0709,schemelike-metacircular-eval,5,"['d7be9106-ba94-4e23-963b-6117831f4c34', '27d5a996-8f33-4373-ae7f-1b57de147385', 'ff190d1a-d2a0-4418-bb98-59957e4a1c69', '76e202bc-cf52-4ece-9ced-ae342005c907', '9b34ad22-6c18-4ff3-a2bd-29077c0ac4fa']","['schemelike-metacircular-eval__korMXBL', 'schemelike-metacircular-eval__pNErsDy', 'schemelike-metacircular-eval__P7gp28E', 'schemelike-metacircular-eval__KkjAiJV', 'schemelike-metacircular-eval__XF9tAah']",0,"[1481.990202, 2414.199164, 2409.700032, 2418.080746, 2406.90402]","[90.133257, 43.904185, 98.174899, 109.60219, 35.786101]",0.0,False,[] +grok-4-0709,sparql-university,5,"['8b012a4f-39f6-4bf0-af46-fda21c0af6cb', '5ef428bd-2533-4283-95f8-2cece4c55e0b', 'e6aec74e-ef43-4284-aaab-941e2deb72a0', '0fab9ddc-e434-4ccd-8ffd-b2056f48fabc', 'd1be0bfc-4226-46a5-8467-44764d0f4b63']","['sparql-university__YsYq7sS', 'sparql-university__nr4nTEh', 'sparql-university__BmEHjPQ', 'sparql-university__J2F8tkR', 'sparql-university__HJdYLwV']",2,"[900.042243, 386.212565, 399.804394, 524.92489, 389.847928]","[49.681883, 38.956237, 28.576189, 140.856188, 57.921443]",0.4,False,"['5ef428bd-2533-4283-95f8-2cece4c55e0b', '0fab9ddc-e434-4ccd-8ffd-b2056f48fabc']" +grok-4-0709,sqlite-db-truncate,5,"['d4049088-08a1-4225-b023-2d1de1163a3c', 'ea726cef-402c-4aaf-80f0-e3c7b63ed41a', '617ec320-3bc9-445e-89b1-015a3f635150', 'd14ba659-84d1-40f4-b2b7-50edccf6a54a', 'e8444f28-f310-4040-9cb2-c61d2b17f419']","['sqlite-db-truncate__9KKBqQd', 'sqlite-db-truncate__eUj8GpQ', 'sqlite-db-truncate__RZesyFG', 'sqlite-db-truncate__GrTD3NR', 'sqlite-db-truncate__GS4Tr2t']",0,"[910.658276, 900.016756, 314.616573, 798.584089, 
909.078122]","[150.784498, 34.503438, 58.310283, 13.604757, 56.191604]",0.0,False,[] +grok-4-0709,sqlite-with-gcov,5,"['744de146-7724-4b53-acea-752d69c10461', '4d5ff12b-68ee-44cb-81a9-dbed85895112', '57c1989a-50ee-4c3b-bf67-13e2e5c00e26', '62815651-ed06-4c4d-88a3-ebeab792569d', '5356da93-6806-4a5e-9ab2-9acf4ad08a2d']","['sqlite-with-gcov__USAosgZ', 'sqlite-with-gcov__ypFyqdY', 'sqlite-with-gcov__9SXc9vh', 'sqlite-with-gcov__v4kPCm2', 'sqlite-with-gcov__FbQxAac']",0,"[491.128847, 482.71818, 652.025607, 697.407031, 441.053005]","[95.121206, 33.8257, 30.244754, 45.388245, 77.434444]",0.0,False,[] +grok-4-0709,torch-tensor-parallelism,5,"['87d93e13-ab4a-4fe3-a171-c60698fafd88', '9d0be9a1-0b68-4a59-8733-3d9a723d6d7b', '4ac52660-8dfd-44ee-8788-728c6bae2047', '1fbd249c-4d0d-4973-b580-82522aaf5e7c', 'e60f5092-6053-406e-9736-379d4abdc560']","['torch-tensor-parallelism__eVptzzE', 'torch-tensor-parallelism__Z5y5FLN', 'torch-tensor-parallelism__5RfW6Mi', 'torch-tensor-parallelism__JfgLezk', 'torch-tensor-parallelism__XkRZQUH']",0,"[306.449619, 182.975585, 558.002263, 812.482565, 653.851522]","[142.277816, 62.759891, 31.215196, 28.321854, 47.331159]",0.0,False,[] +grok-4-0709,train-fasttext,5,"['d46da707-f363-421d-a013-9f55fa03bc25', '87950f72-f3a3-4b05-8f32-a298dbd2a7b8', 'c4357ef5-fce0-4ac9-b1e7-6475f44322eb', 'e85c93ef-5a1e-49f9-82de-fb84a96a5aa2', '1214de4f-0f26-4299-98c6-a6466657c114']","['train-fasttext__o6Yfyfa', 'train-fasttext__NYUZQmF', 'train-fasttext__gX9z2nb', 'train-fasttext__796TkcX', 'train-fasttext__Dd4uipw']",1,"[3601.974087, 3621.500217, 3646.909724, 2002.210252, 3600.00844]","[46.440656, 24.033943, 20.610252, 23.383759, 33.430853]",0.2,False,['e85c93ef-5a1e-49f9-82de-fb84a96a5aa2'] +grok-4-0709,tune-mjcf,5,"['f4b565ee-d020-4275-b01c-2f537519bee1', 'dc10df82-13c8-4561-8a00-f9d41d73eb40', '502c635d-4bef-4b74-b097-662d75cd3bcb', 'a9544ebb-ae24-4d40-bd06-a6a7924202c0', 'a9021d08-4108-4d4a-8ef0-541b67f3ea5d']","['tune-mjcf__5SvBwUu', 'tune-mjcf__du9HHbQ', 
'tune-mjcf__neAUAmA', 'tune-mjcf__XSAti6E', 'tune-mjcf__JojREM6']",0,"[929.268954, 900.081627, 903.215264, 903.023304, 907.29432]","[32.503665, 9.860652, 68.771226, 14.754604, 14.70339]",0.0,False,[] +grok-4-0709,video-processing,5,"['3a93cf5c-a5ea-49e4-8b6d-5faaa625fb56', 'bed5c58a-67a6-4675-8181-9de60c149ca3', 'e3432469-bc98-4649-955f-c43d27d5eec5', 'bc525386-45b2-4772-902c-65513e8adb60', '7ccb38d2-3176-48cf-a5c1-9bef862ba465']","['video-processing__fYQqfWN', 'video-processing__f2vZmTo', 'video-processing__cumV5x3', 'video-processing__tQER8Hj', 'video-processing__DGgh7ik']",0,"[252.691189, 311.753488, 185.652558, 239.463111, 1404.157416]","[26.694555, 83.070919, 13.84833, 59.373614, 25.535616]",0.0,False,[] +grok-4-0709,vulnerable-secret,5,"['1d595ab4-6d13-4782-a2aa-d16f21026d9d', '1ee4effa-e62b-4eee-91f2-ddf6a6db9821', 'f97dc390-b7ba-4935-bf82-f79e02d159dd', '4b204004-32c6-4344-aa67-cb8b31b93f32', '8d60cb79-0ef3-40ce-9f9e-b842c69a3e02']","['vulnerable-secret__sWm3Xxb', 'vulnerable-secret__ifuH4oc', 'vulnerable-secret__WLi9ySN', 'vulnerable-secret__77B4SxC', 'vulnerable-secret__g58AGNp']",3,"[767.651047, 900.19694, 841.34485, 901.390157, 923.415844]","[29.477426, 13.231331, 10.05726, 11.102102, 12.726763]",0.6,True,"['1d595ab4-6d13-4782-a2aa-d16f21026d9d', 'f97dc390-b7ba-4935-bf82-f79e02d159dd', '8d60cb79-0ef3-40ce-9f9e-b842c69a3e02']" +grok-4-0709,wasm-pipeline,5,"['45321289-eb82-4da9-baf1-67854c074334', '57dfbc3a-5fe4-4138-ac2e-9e096cd2525e', '09a4e990-4665-43ed-9ca7-88ffb38cf655', 'e19214c7-11e0-4d3c-be5f-60e01bac3915', '959c199e-d8c0-4844-bb2c-a935554d12b8']","['wasm-pipeline__rHS3Zf3', 'wasm-pipeline__HZae7PK', 'wasm-pipeline__qrZTiVh', 'wasm-pipeline__Y493qZk', 'wasm-pipeline__Jz5ipUC']",2,"[919.291095, 859.199082, 475.233157, 510.127774, 676.326044]","[12.305849, 4.92177, 4.141565, 11.022535, 11.91841]",0.4,False,"['57dfbc3a-5fe4-4138-ac2e-9e096cd2525e', '959c199e-d8c0-4844-bb2c-a935554d12b8']" 
+grok-4-0709,winning-avg-corewars,5,"['eef73477-a988-43f9-8501-ab54dbab36b0', '9f3a78ae-9fdb-4762-98b4-774eeeaa2cf7', '31481f3f-1733-40df-9020-3bed9c3f3bda', '9791aaad-5e69-43a1-8380-d5a05935faa0', 'b75addfe-e049-4cad-85b7-3c8cbff30918']","['winning-avg-corewars__CjmovLx', 'winning-avg-corewars__QBmaFxa', 'winning-avg-corewars__bZwPMQK', 'winning-avg-corewars__rEX5ZQs', 'winning-avg-corewars__iDaQkHx']",0,"[3616.264834, 3604.435153, 713.651057, 3626.878843, 3617.640234]","[36.861142, 15.178494, 37.096644, 4.964962, 84.391467]",0.0,False,[] +grok-4-0709,write-compressor,5,"['da1e135a-1f9b-43f3-b01a-3c48f74205cd', '30145c9c-5e21-4eca-93ff-7e627799214b', '944582c8-707e-4b74-891b-c763a689827c', '6f35d2a2-4ad5-4fe6-b0e2-22f99e24418f', 'ba414c4f-042f-4d73-ba2a-c4bc05eee3c8']","['write-compressor__hbf8DUB', 'write-compressor__38jiktB', 'write-compressor__DqrkDq6', 'write-compressor__utZMTXj', 'write-compressor__oGu7d7N']",0,"[904.310914, 900.477512, 908.163267, 903.095772, 934.074333]","[33.578032, 46.529131, 152.018348, 78.120371, 72.167589]",0.0,False,[] +grok-code-fast-1,adaptive-rejection-sampler,5,"['aec6612e-395b-4562-b6b0-654398923805', '2adc619d-8a1d-4ea0-9101-5bfa8b40e1c4', 'e32b8814-b4e0-4773-8baf-cad93412979b', 'e61b7d43-d9de-483d-9ab5-7234d8248388', '92e85f30-8eca-4068-8444-d23552bc115d']","['adaptive-rejection-sampler__vPeicaJ', 'adaptive-rejection-sampler__YdqasT5', 'adaptive-rejection-sampler__gWAGrpL', 'adaptive-rejection-sampler__RrQYfYK', 'adaptive-rejection-sampler__jFARYew']",0,"[488.475857, 567.466922, 310.526187, 236.884964, 283.63497]","[54.775634, 139.908242, 38.419084, 60.964755, 25.978215]",0.0,False,[] +grok-code-fast-1,bn-fit-modify,5,"['96d921ad-2d82-4847-aca9-27bc88441a3c', 'c879060f-a87f-417c-a6a9-5664e8ad0470', '77d7cbae-288b-4ea7-9d0b-df6f4b4279b9', 'cf241e94-fd59-4019-88fd-ebd85e1a36ce', 'f08ccb40-eb68-4e21-a713-7ff8d95324a6']","['bn-fit-modify__QAuwhmE', 'bn-fit-modify__zGVGGtN', 'bn-fit-modify__9Mf3z3x', 'bn-fit-modify__bK9s5sg', 
'bn-fit-modify__KXuDr8C']",0,"[514.002196, 1031.690114, 369.947591, 1394.598372, 1107.363996]","[97.904057, 254.74621, 22.274197, 68.26349, 109.382806]",0.0,False,[] +grok-code-fast-1,break-filter-js-from-html,5,"['8452678e-763f-4333-afff-48fe64f6082d', 'bab6229c-b11f-4c20-8b67-c20987478ac4', '15d28e88-e51c-4aa6-b41f-bc09a440a57f', '6f65eda1-c81b-4f27-998a-10a5aa38b875', '6f2286cb-37a3-427f-affa-a247a637b3f6']","['break-filter-js-from-html__LcKdwuX', 'break-filter-js-from-html__BWnjF5m', 'break-filter-js-from-html__iSbAvqr', 'break-filter-js-from-html__7FJHpTk', 'break-filter-js-from-html__Q68TAiq']",0,"[299.814663, 476.606194, 796.159249, 582.49914, 149.44933]","[13.318754, 89.936257, 91.184523, 141.634927, 91.631806]",0.0,False,[] +grok-code-fast-1,build-cython-ext,5,"['99406396-6b9a-474f-92bc-c372074309ba', '30faa2f0-06a9-45ed-b6fe-484514542f19', 'd2cb35a7-181d-4335-bc70-a9906dde9e7d', 'd4416e2d-af9f-42b9-814f-622638fc47c1', '72a03d34-a27c-4f1c-a23d-606c3ba778d8']","['build-cython-ext__K58ouPT', 'build-cython-ext__QwUh5pp', 'build-cython-ext__tcPh4uV', 'build-cython-ext__xmNBYGC', 'build-cython-ext__jKPsUyv']",0,"[705.459425, 912.264186, 908.508152, 788.534485, 480.811365]","[151.595963, 74.174826, 73.575948, 94.403218, 8.10517]",0.0,False,[] +grok-code-fast-1,build-initramfs-qemu,6,"['9e9a2d24-9b23-4a95-a8e1-2cb8ef75fbe5', '04968b24-13d5-41f7-8863-8a20b73666bc', 'd709b652-fce6-4d3b-8dd2-eb88402bf317', '6d490062-4b3f-45a3-8ccb-6464cf9f007c', '72041167-8233-4bcb-8065-704fec899395', 'd5a6d572-6933-49c6-ab6a-d2927bb7aca4']","['build-initramfs-qemu__MXGr6aV', 'build-initramfs-qemu__TU8XJPa', 'build-initramfs-qemu__Ke5FpLB', 'build-initramfs-qemu__k7HtJSp', 'build-initramfs-qemu__TxxzgpA', 'build-initramfs-qemu__Q8ixi8w']",0,"[37.845297, 148.588737, 138.400149, 46.849707, 80.830086, 45.989782]","[7.436033, 97.089522, 41.646591, 7.067805, 22.844732, 21.775057]",0.0,False,[] +grok-code-fast-1,build-pmars,5,"['da970409-acf6-4732-9876-2e7b5b18c88a', 
'e3cc33a2-fdc7-4956-92ca-7ad94ee08590', '8f1b0971-ef33-4ec6-9412-552af16195cd', '4aa51b5d-590b-4b70-95b9-932dd4828580', '9cc75497-c668-4dc6-81be-000a051c3d42']","['build-pmars__z2Ps8bz', 'build-pmars__7qCHW2C', 'build-pmars__RNiRZfh', 'build-pmars__gNvxVwU', 'build-pmars__bpDFgob']",4,"[482.589914, 330.507402, 783.378833, 921.134999, 905.676879]","[8.862004, 48.879993, 33.778137, 5.198246, 18.754611]",0.8,True,"['da970409-acf6-4732-9876-2e7b5b18c88a', 'e3cc33a2-fdc7-4956-92ca-7ad94ee08590', '8f1b0971-ef33-4ec6-9412-552af16195cd', '9cc75497-c668-4dc6-81be-000a051c3d42']" +grok-code-fast-1,build-pov-ray,5,"['cde3bd3f-dda3-4702-a08a-4262816d2115', 'a03d1eb8-1ef8-4993-beda-0d1aa75a858d', '9e365c1e-fc30-4efe-8a9f-867caa971807', 'bced4c14-26c3-4a76-a701-2a0668122540', 'b233acb8-c9ac-41b7-aa8f-5528feb90190']","['build-pov-ray__27dvdUa', 'build-pov-ray__grL5i2P', 'build-pov-ray__FasRzsD', 'build-pov-ray__gUpGH7K', 'build-pov-ray__Z9TaXtN']",1,"[2396.423036, 1235.74473, 2571.284066, 188.477947, 1342.738897]","[33.167702, 43.352415, 75.523229, 97.735558, 57.405531]",0.2,False,['a03d1eb8-1ef8-4993-beda-0d1aa75a858d'] +grok-code-fast-1,cancel-async-tasks,5,"['63ac2895-a7c5-483d-a577-165dc14fb79f', '938e8490-0734-4060-8e96-96cb4326be15', 'b17d3a4f-8dd6-4be9-8994-8c94e7baea62', '1153a511-4f5a-4df4-a342-b1946cacfab3', '10ca91fd-31f4-4ef3-a567-3932041a0352']","['cancel-async-tasks__HmioFNx', 'cancel-async-tasks__L5jM63c', 'cancel-async-tasks__aw9pTqt', 'cancel-async-tasks__VN5STLW', 'cancel-async-tasks__K6iphNr']",1,"[165.10426, 99.131105, 50.394023, 58.514461, 66.96576]","[170.165035, 101.306308, 60.352141, 31.032858, 96.090336]",0.2,False,['938e8490-0734-4060-8e96-96cb4326be15'] +grok-code-fast-1,chess-best-move,5,"['208b35c4-fb6f-4a58-8c9e-47a6c2532430', '4d772dfc-a25e-4c74-9ee6-adb56a3a5d5d', '465c0eb3-2a7c-4df1-b74d-7bd97a67aa0b', '06f4219a-bdb7-47dc-861f-e1f5531db679', '64ca0768-162b-49b4-95dc-510047e96b06']","['chess-best-move__9FSN2K6', 'chess-best-move__dxKd5nd', 
'chess-best-move__NiXzqqE', 'chess-best-move__AWYbAGD', 'chess-best-move__cF5gras']",0,"[66.885994, 747.076536, 505.857087, 47.413769, 64.335596]","[13.213447, 36.625548, 66.706009, 10.671914, 169.679213]",0.0,False,[] +grok-code-fast-1,circuit-fibsqrt,5,"['93f981af-778f-42d2-967e-db8f6bf96c44', 'b90c822e-69ca-49bb-bb60-4d22384970f7', '1819721b-f274-40fc-b555-94bfc70da60a', '2c7ec8df-5d88-45c9-9e73-954e41eeffcb', '8253632a-5d6e-4cbb-9b1e-17e764ef1f3b']","['circuit-fibsqrt__TyuJFi9', 'circuit-fibsqrt__qFDoFe2', 'circuit-fibsqrt__FUqkybw', 'circuit-fibsqrt__zuLysJi', 'circuit-fibsqrt__Gqb4qsq']",0,"[356.702902, 310.520974, 283.542628, 204.260426, 202.291142]","[90.718562, 57.296618, 25.481372, 17.828966, 17.71854]",0.0,False,[] +grok-code-fast-1,cobol-modernization,5,"['a39e4c84-ce1a-4423-98a8-c935982a9dc9', '014bc748-6694-44a2-a6dc-ee732ffbb905', '260cd378-8b62-4c46-9701-2d6db990c7f0', '193e3363-8b25-4836-b7c3-863aa886a4f2', '8b5c92dd-4b5c-40db-86a0-7f930db8c8c5']","['cobol-modernization__gry355G', 'cobol-modernization__vfs9RLv', 'cobol-modernization__YiSp2PZ', 'cobol-modernization__T85UJyy', 'cobol-modernization__yga2uja']",3,"[775.841924, 153.668445, 141.010751, 105.695752, 403.320067]","[122.831318, 62.680914, 53.233185, 76.541478, 71.693585]",0.6,True,"['260cd378-8b62-4c46-9701-2d6db990c7f0', '193e3363-8b25-4836-b7c3-863aa886a4f2', '8b5c92dd-4b5c-40db-86a0-7f930db8c8c5']" +grok-code-fast-1,code-from-image,5,"['686fb927-8a47-4d41-aa5a-30b8e72e08a8', '677b8b59-0e58-41d6-8504-0f75cb8be454', 'c886dc20-b62b-4425-94e2-f1486061badf', '6ebac9dd-0263-486c-8321-3f14341cf178', 'd14f3394-d572-4330-937b-5fd9afa9841e']","['code-from-image__Uw5dVdj', 'code-from-image__hGmJBRU', 'code-from-image__sHGMYRm', 'code-from-image__oneF3f9', 'code-from-image__hYJTzS2']",0,"[130.496806, 297.290677, 343.988905, 254.830644, 1866.610925]","[20.674846, 54.752772, 119.008989, 81.80255, 65.692655]",0.0,False,[] 
+grok-code-fast-1,configure-git-webserver,5,"['d4b97c07-8f82-40c3-83fb-b6ec8b5665d5', '8853c917-ff48-4149-aca0-95a2a327bd4b', 'f9402f1d-67fe-4233-a686-9ff67787619b', '85bded94-4836-4fbb-8f52-e9db02b46261', '56b6ccfa-b007-4cf4-965e-6d02ab8f80f1']","['configure-git-webserver__oRTkKsV', 'configure-git-webserver__8Mpbw8f', 'configure-git-webserver__oQa4WCD', 'configure-git-webserver__XjTv8o8', 'configure-git-webserver__3sCXkX4']",0,"[155.284657, 266.269946, 159.346256, 97.397409, 384.738326]","[63.277077, 109.61811, 59.035354, 40.233406, 66.962352]",0.0,False,[] +grok-code-fast-1,constraints-scheduling,5,"['98c24cda-934d-4b66-8665-73d09202625b', 'ce4b5553-f0fa-46a9-a805-7a1b280a580f', '206a9c8e-e70f-4a0d-8e2a-34222840df5b', 'ea4eb20d-cead-4887-8ab6-af9ebb140d1e', '72df27a6-6388-444c-8136-2f3c5e524404']","['constraints-scheduling__4tGotLx', 'constraints-scheduling__2i8eYe8', 'constraints-scheduling__fXQ7PUt', 'constraints-scheduling__YC9JJHX', 'constraints-scheduling__ukyTVat']",4,"[457.227131, 283.639193, 83.74445, 147.825986, 188.243495]","[218.229088, 24.635606, 66.754101, 111.952894, 98.355355]",0.8,True,"['98c24cda-934d-4b66-8665-73d09202625b', '206a9c8e-e70f-4a0d-8e2a-34222840df5b', 'ea4eb20d-cead-4887-8ab6-af9ebb140d1e', '72df27a6-6388-444c-8136-2f3c5e524404']" +grok-code-fast-1,count-dataset-tokens,5,"['9a631723-ce2f-4fca-9639-65bcee16011a', 'de8815d3-c935-4a74-a7fe-af4eccf048c6', '6b160cb1-2a3d-4543-b97d-7e66763896b6', '8a802119-742c-4c1c-aa94-e684193f40ee', 'e3d620b9-73cb-40d1-b0ba-495a6f98440a']","['count-dataset-tokens__RkVaHDb', 'count-dataset-tokens__yeFDbzn', 'count-dataset-tokens__c3F5o5i', 'count-dataset-tokens__3w4GwGb', 'count-dataset-tokens__WgsbyfQ']",0,"[340.246446, 255.548271, 773.919599, 935.432369, 525.354606]","[17.085104, 42.022251, 16.870941, 132.38195, 22.916181]",0.0,False,[] +grok-code-fast-1,crack-7z-hash,5,"['9c19395b-df4b-4347-bf84-cdf2065c6b3e', '334a7b50-49b5-4f5e-a239-f27ec1039d41', '4f48eaee-cc2e-4f71-9624-fefc9da2945a', 
'8fb2ad7c-7b16-4470-82fe-37bfd913d0c0', 'd0738b88-a75e-451b-841c-1e47cd219ac8']","['crack-7z-hash__H4McsnJ', 'crack-7z-hash__cKz585Q', 'crack-7z-hash__vbd8KxF', 'crack-7z-hash__LhQZDvr', 'crack-7z-hash__MzdvN6Q']",3,"[907.556997, 916.788392, 657.528846, 307.733225, 759.74762]","[15.657556, 47.963805, 71.282344, 7.538281, 26.369054]",0.6,True,"['4f48eaee-cc2e-4f71-9624-fefc9da2945a', '8fb2ad7c-7b16-4470-82fe-37bfd913d0c0', 'd0738b88-a75e-451b-841c-1e47cd219ac8']" +grok-code-fast-1,db-wal-recovery,5,"['938d6b2d-b5c7-404f-92ce-5226f75754c8', '30f4fee6-65ac-45c8-aae0-14db8e776602', 'd9ff0f91-4bd3-4746-bf1e-e9f733eea15b', '46a6738a-f320-454b-8109-a38fc5a7b9c7', '174a95cd-d2b2-491a-add5-353b4ef89347']","['db-wal-recovery__tGGcKwg', 'db-wal-recovery__ugkfXp3', 'db-wal-recovery__7ZP4Zpa', 'db-wal-recovery__6ymHPFy', 'db-wal-recovery__WwneXNk']",0,"[122.183828, 511.038757, 490.638608, 255.988499, 160.907653]","[15.264434, 42.013809, 79.734635, 54.305985, 13.758175]",0.0,False,[] +grok-code-fast-1,distribution-search,5,"['99491274-4346-4e7c-a348-ac0036295123', '249dca27-0cc7-4d7a-b9b4-6aad31ae3139', 'a952debc-fabe-4421-9ef7-053739177604', 'b2473772-5749-4e59-a09e-1f8fb863711c', '6509474a-58f9-4e6e-8606-432b533503e4']","['distribution-search__mfX3hC2', 'distribution-search__YHneWgp', 'distribution-search__2bzs9nv', 'distribution-search__RFMgNJP', 'distribution-search__k5LKqfg']",0,"[218.328378, 192.206809, 267.021554, 415.286067, 366.596882]","[156.311474, 204.248832, 28.907811, 64.493176, 27.209669]",0.0,False,[] +grok-code-fast-1,dna-assembly,5,"['e8f24a2b-32b5-4992-82ed-07ed48d2fa10', '28107a4a-8f31-47f0-a3fc-3bcc76503248', '90e9dde5-ba53-40b8-9429-5899f7cff37b', 'fedddab2-c70d-4c8e-8a2e-55e952b992fb', 'eda5dfea-e3ea-4ca3-857b-604d9f1b352c']","['dna-assembly__9uZSewM', 'dna-assembly__Ve6HQ8p', 'dna-assembly__9pMAgoH', 'dna-assembly__T4SAz4G', 'dna-assembly__qrPZBvf']",0,"[120.414696, 59.790115, 197.337656, 720.266035, 138.63623]","[64.093481, 118.027122, 38.93602, 
67.684421, 180.656408]",0.0,False,[] +grok-code-fast-1,dna-insert,5,"['1f869daf-56d3-4393-8e53-c986c3d92a13', 'e3a55e78-036b-42c2-b8e3-8f7d6756eeea', 'e456e088-f414-4e9b-b591-afe167b303f5', '78e2e2b6-991b-4273-834d-4955844f83ee', '4d0065a9-4aa6-411b-8936-449279085253']","['dna-insert__M5SXhmz', 'dna-insert__sAictNd', 'dna-insert__xbwGfvj', 'dna-insert__C2z64vh', 'dna-insert__izarQvS']",0,"[170.686827, 146.885531, 385.976852, 190.506054, 368.980774]","[86.583694, 18.463913, 41.062818, 19.275755, 305.22415]",0.0,False,[] +grok-code-fast-1,extract-elf,5,"['3df39360-b769-4bf1-b365-32dc8564cc64', '4e3a4215-049d-47d9-a8ac-a3632ab8024d', '59230b88-d3e4-4114-b784-a545e4d4f7ec', 'f0579349-bf5f-4ab0-9dc8-b1428c3242cb', '1dc5f35b-3e1f-474d-bd59-4d5ef6928bbc']","['extract-elf__dzdx9ou', 'extract-elf__t6ybZed', 'extract-elf__g5SHvdS', 'extract-elf__CbZVBQ5', 'extract-elf__HjYVNmU']",3,"[91.67386, 282.526449, 96.344268, 301.160626, 340.772261]","[32.56533, 94.994233, 22.956898, 87.246238, 32.020706]",0.6,True,"['3df39360-b769-4bf1-b365-32dc8564cc64', '4e3a4215-049d-47d9-a8ac-a3632ab8024d', 'f0579349-bf5f-4ab0-9dc8-b1428c3242cb']" +grok-code-fast-1,feal-differential-cryptanalysis,5,"['4c9bf875-99a7-412f-8550-8dd08811189a', 'f94a492f-d93f-46e1-a3cf-24d0237f98b0', '0b052031-7b5f-4406-95cf-d6f2e4be43d3', 'cf8fc772-27ef-46c5-a0ef-c98b3aa84484', '686b746b-b3cf-46b7-8a7c-c2698d55cfab']","['feal-differential-cryptanalysis__aXJxxbc', 'feal-differential-cryptanalysis__V9UUVVh', 'feal-differential-cryptanalysis__dkXMQeg', 'feal-differential-cryptanalysis__mBNgd7n', 'feal-differential-cryptanalysis__xZScwiA']",0,"[263.713261, 149.303963, 472.351033, 165.958678, 148.443599]","[247.146887, 13.639101, 22.398372, 129.985055, 280.296664]",0.0,False,[] +grok-code-fast-1,feal-linear-cryptanalysis,5,"['70a1c023-8126-49a3-938d-7cea810588fe', '6e12f3dc-1378-4e86-992d-8dfad8ef555b', '8e09137e-fff0-4cf0-aec0-9f4d90e08748', '2c1a6033-8906-48c7-9701-78aa1714f30a', 
'c7ab5712-aff6-4792-8105-3358b797720b']","['feal-linear-cryptanalysis__riu4Qtn', 'feal-linear-cryptanalysis__fAL6HSb', 'feal-linear-cryptanalysis__8ZM9GLK', 'feal-linear-cryptanalysis__QUdXgSW', 'feal-linear-cryptanalysis__t6BoJ2f']",0,"[631.881206, 307.19413, 900.854049, 777.650423, 625.302822]","[85.889226, 68.515434, 157.087235, 20.730748, 56.668543]",0.0,False,[] +grok-code-fast-1,filter-js-from-html,5,"['472c5afe-743c-4eb6-be36-eb3e2b1bccb6', 'f5283f4b-8974-43f7-a40c-ee5fa96ec462', '57bc73e1-df70-46eb-8427-ba59efd4b9af', '429e99de-f645-44c4-bb74-feded6c11639', '7a484c9e-f117-43f9-b0fd-1382ee75bc04']","['filter-js-from-html__3JYsWLo', 'filter-js-from-html__Eiaye9o', 'filter-js-from-html__iefbViY', 'filter-js-from-html__eQGGUqx', 'filter-js-from-html__StFnzHF']",0,"[39.359657, 68.472217, 367.982357, 32.701211, 35.77445]","[51.823047, 54.297497, 115.986212, 35.584127, 48.503849]",0.0,False,[] +grok-code-fast-1,financial-document-processor,5,"['5cc908a0-b8b0-4596-883e-30344ce209a9', '1d2345d6-e057-4f24-8e65-8790edce7774', 'c2ccdb5e-8a42-4a1a-9708-4511877bc04b', 'a8f215e1-ed86-4396-9cf3-220dedb14464', 'b5792fa5-773f-4f70-bb74-19e2997a75e1']","['financial-document-processor__Lg8RXAL', 'financial-document-processor__ySsbio4', 'financial-document-processor__hrCndGK', 'financial-document-processor__6MgYupR', 'financial-document-processor__MKSskp8']",0,"[328.287738, 331.041978, 295.970427, 87.683204, 83.73838]","[29.720705, 117.631737, 25.564601, 116.056699, 235.874611]",0.0,False,[] +grok-code-fast-1,fix-code-vulnerability,5,"['17da5b2b-eb9f-487b-b725-fe379680d6b1', 'aa63a451-665d-4dd6-84f0-17468df2227d', 'e64fccba-96bb-40ba-ace7-289de375f3a4', 'f73ca943-2986-4039-bf97-bfa98b99fc0c', 'be90131b-91f0-4804-98ca-13cd5b1f869e']","['fix-code-vulnerability__fDAUreJ', 'fix-code-vulnerability__7JQkjZn', 'fix-code-vulnerability__sGbrxH8', 'fix-code-vulnerability__SgWcUMV', 'fix-code-vulnerability__P3dMhFe']",0,"[165.510629, 900.071085, 344.88578, 928.578719, 
367.197265]","[41.021836, 76.192144, 12.833966, 5.249803, 58.161604]",0.0,False,[] +grok-code-fast-1,fix-git,5,"['623a966d-53ac-450c-96d8-8d84204ff3aa', 'eadedfe7-471b-4113-b853-13d373ac303a', '5fe15e49-cfc2-4b14-ba17-7e3b5f2df5a3', 'd3738041-2571-4869-8f9b-d0c6b483f30e', '967301e6-a3da-4932-97db-329020ce7f6e']","['fix-git__TVJghgU', 'fix-git__uu7Y4xE', 'fix-git__6QYTpfC', 'fix-git__Vp26XUc', 'fix-git__4XRtuty']",1,"[82.770473, 199.538043, 852.275154, 369.801683, 260.749011]","[40.610128, 45.264456, 64.474199, 31.06923, 72.387543]",0.2,False,['967301e6-a3da-4932-97db-329020ce7f6e'] +grok-code-fast-1,fix-ocaml-gc,5,"['12d2ff45-5d78-4e93-ae43-67d218550b9a', '6cba3f53-e365-4a02-90fb-79517d752af0', '5bfbcca6-221a-437e-81d2-7d00604f661d', '3ccd2fb7-1823-4cd0-ae9e-4154268de659', '7c56abc1-3133-4715-80bf-bc250963e9cd']","['fix-ocaml-gc__fVBjN92', 'fix-ocaml-gc__vvvChLd', 'fix-ocaml-gc__otoJCTw', 'fix-ocaml-gc__PYxSegE', 'fix-ocaml-gc__ibrjE3K']",0,"[475.455921, 1485.734256, 2073.222343, 798.084791, 1973.564711]","[33.385878, 119.519931, 14.035893, 47.671563, 60.397591]",0.0,False,[] +grok-code-fast-1,form-filling,5,"['09daf0a3-0be2-4108-84ba-73ed4c8b262e', 'a8203cf0-f2d6-4f59-91da-80b8b0c3076d', 'ef80d46c-70a9-4a33-a02f-15c011616e29', 'dcec8655-8344-45ff-ae61-00efa79f4234', '6744f165-9919-4ba8-a04c-bddfd0fc46c2']","['form-filling__vod655M', 'form-filling__ubLwFEF', 'form-filling__8MVGjoL', 'form-filling__NxAkW2t', 'form-filling__6BHUB2Z']",3,"[326.551391, 310.594237, 204.388012, 86.797682, 118.443591]","[22.707979, 37.428633, 4.775181, 9.406561, 8.454541]",0.6,True,"['09daf0a3-0be2-4108-84ba-73ed4c8b262e', 'a8203cf0-f2d6-4f59-91da-80b8b0c3076d', '6744f165-9919-4ba8-a04c-bddfd0fc46c2']" +grok-code-fast-1,git-leak-recovery,5,"['8af4b9ac-dcda-4bf0-aff9-b13947a9ee5c', '03e75e83-d09e-4936-a970-f869509dae21', '2ef18b10-d2a9-4857-8d63-f3e631024650', 'bc56cbdc-25b6-4c67-ae2d-711c9dab8f69', '25bcc30c-935b-4b86-afde-8f6751dfdaf1']","['git-leak-recovery__SthcHDf', 
'git-leak-recovery__zUNwwHe', 'git-leak-recovery__G92qo8P', 'git-leak-recovery__CdPfdHt', 'git-leak-recovery__vRxx8Mr']",1,"[123.645644, 77.518181, 290.527972, 35.950961, 214.798702]","[29.369933, 58.866277, 27.897707, 16.669902, 40.99536]",0.2,False,['8af4b9ac-dcda-4bf0-aff9-b13947a9ee5c'] +grok-code-fast-1,gpt2-codegolf,5,"['4657c8d9-2d07-41fb-a682-0077dd737d78', '1fc5b8b3-54fb-4b1a-b003-1fb04ad2826c', '32f6148f-d383-401c-873e-bca2ba8a7afe', 'f3bee811-1337-40bc-b1bc-7ed8088e56ec', '7ab19ed0-bdc0-422b-88a2-03931ee7ff8d']","['gpt2-codegolf__rX8eJYK', 'gpt2-codegolf__2aAJgXX', 'gpt2-codegolf__WAnZNuf', 'gpt2-codegolf__krGU8Cz', 'gpt2-codegolf__Usu27kV']",0,"[44.607847, 69.75182, 159.615188, 34.891083, 47.196831]","[17.499327, 188.319716, 76.525794, 23.985259, 69.804333]",0.0,False,[] +grok-code-fast-1,hf-model-inference,5,"['a84efdf1-6156-4caa-b18e-69f177573f3e', 'f8204e16-9b97-4616-a709-4c978e18f931', '150b4736-4bf4-4e87-826c-154a6b2cdfd2', '856b9854-86c6-45a4-aa4f-0c31c512e1a8', '3d48106b-4428-4b61-8344-5cfbb1654b17']","['hf-model-inference__27P9pgE', 'hf-model-inference__BfXdgLZ', 'hf-model-inference__KT57uou', 'hf-model-inference__sVuy2GR', 'hf-model-inference__fj5N9dV']",2,"[212.010365, 84.616999, 134.600098, 152.852531, 85.622256]","[13.145887, 53.874307, 63.497582, 25.552186, 38.822705]",0.4,False,"['150b4736-4bf4-4e87-826c-154a6b2cdfd2', '856b9854-86c6-45a4-aa4f-0c31c512e1a8']" +grok-code-fast-1,install-klee-minimal,5,"['d7e84b9c-fb8d-4bd9-8792-5ba94104bba4', 'af94516c-8e30-433b-9281-2445048c3173', 'fee2e9ad-5aee-4cd4-894b-26e071c71c93', '40f175e0-41c0-4ece-bd2d-c362337fe1a1', '7bc53f63-700f-4bfa-a688-d925ebbc9e6a']","['install-klee-minimal__ScmoRkq', 'install-klee-minimal__mTnr9t5', 'install-klee-minimal__gBdKoTf', 'install-klee-minimal__CjW88t8', 'install-klee-minimal__r4eyFig']",0,"[908.998116, 900.001959, 479.099412, 900.032245, 900.470523]","[38.50816, 37.562041, 201.783139, 65.061338, 164.763999]",0.0,False,[] 
+grok-code-fast-1,install-windows-3.11,5,"['f1ed4354-e3be-4398-b2f4-5651da591e36', '8dd02d32-814e-478d-a0d2-b0c821c6f2ec', '908fd45f-ef96-49cb-9c88-7514f3f59e98', 'ebfc759b-138b-41f5-922f-7599feafce91', 'e88e3d91-35af-425a-b81a-9f6d4a6c662a']","['install-windows-3.11__ETXE5xq', 'install-windows-3.11__fQbhKwk', 'install-windows-3.11__E6inXGi', 'install-windows-3.11__QvEiKbZ', 'install-windows-3.11__h2LddXB']",0,"[320.577613, 1112.760538, 222.356272, 852.042047, 194.912933]","[32.864253, 21.970175, 32.162685, 69.223883, 43.458608]",0.0,False,[] +grok-code-fast-1,large-scale-text-editing,5,"['6634cdb8-cbb3-4206-aa65-6b897fdb6bb2', 'dc4a31c6-85a4-44cc-83ed-69c1cb29de6e', '0cd89299-0805-434f-b281-fb01f768a7e6', 'b2c829d1-b88a-413d-a414-3066eef23534', 'd372fa99-92ec-40e8-91ae-24a4d9357550']","['large-scale-text-editing__rqaxwqH', 'large-scale-text-editing__f3CSJqx', 'large-scale-text-editing__vjTHPYx', 'large-scale-text-editing__fcDW6Cs', 'large-scale-text-editing__CibJ79L']",0,"[106.596472, 208.982002, 558.664554, 161.207289, 120.093058]","[97.132019, 198.787418, 22.626006, 321.218731, 34.339629]",0.0,False,[] +grok-code-fast-1,largest-eigenval,5,"['b3750943-d6ab-41d7-a756-aa7997b84b1c', '73334acf-c2d6-4d74-9cd5-1df50690103d', 'ec706b11-1e87-48ba-93aa-72ab7fb00467', 'bac75088-6e38-43cd-a256-4f5065278f7c', '2fda543a-55ec-4299-9fd9-6d6e8cb68c09']","['largest-eigenval__KqHd7yW', 'largest-eigenval__VUHKnox', 'largest-eigenval__G2giYc5', 'largest-eigenval__2nVETQN', 'largest-eigenval__XhsjPNH']",0,"[905.303051, 908.582583, 900.198927, 761.680012, 949.914758]","[144.500379, 58.150473, 145.521429, 143.937369, 40.645924]",0.0,False,[] +grok-code-fast-1,log-summary-date-ranges,5,"['5faa7bb1-2260-4e2f-907c-9f5311f64452', '1eedae27-bd40-4e49-a7ea-7e53f3ea2559', '77cfe204-6dfc-493b-b593-19f9bf76f5ad', 'dc9c0b1f-74a0-49e0-83b2-94fcfcc437b1', '31e167bc-8931-46b2-bd3d-302b2a65d47d']","['log-summary-date-ranges__5GBM5gL', 'log-summary-date-ranges__N3NNfvh', 
'log-summary-date-ranges__rjEouY2', 'log-summary-date-ranges__yneFe2a', 'log-summary-date-ranges__GEqfxeH']",0,"[166.377165, 135.948771, 96.015003, 192.412587, 44.254706]","[92.618758, 77.463873, 13.724075, 57.902655, 158.220855]",0.0,False,[] +grok-code-fast-1,make-doom-for-mips,5,"['066fbfe6-f59c-4fc4-8e3f-41da24ca2026', 'e9cf0f4f-85fe-42ac-903a-6230bf4cc8ce', '44db6da9-f3f8-4344-88af-74627abe5796', 'e6f23cad-9881-4526-9dd7-9b907bbe37fb', '2adc6d64-018c-4698-a43f-d221ba4ba398']","['make-doom-for-mips__L3HQKAh', 'make-doom-for-mips__iVQtiSq', 'make-doom-for-mips__BgvMW2N', 'make-doom-for-mips__Fbodpkc', 'make-doom-for-mips__LCRzGER']",0,"[578.118148, 636.112899, 739.340836, 589.842526, 900.568042]","[78.704034, 48.239759, 22.976898, 31.865569, 168.414001]",0.0,False,[] +grok-code-fast-1,make-mips-interpreter,5,"['d3b1b785-6b03-48cb-a2d0-ebe693ff184c', 'cb02b4ad-c656-434a-a32f-fca3e475be87', 'f0437214-8b1f-42bd-86cf-480e9fad0f7c', '0e5258c5-aa4f-43d2-bb3c-8e7fa1764fa6', 'cb552c04-f6df-416e-b20c-da69d7ee8d92']","['make-mips-interpreter__Vsj2kGZ', 'make-mips-interpreter__vWagHDZ', 'make-mips-interpreter__SPJ6Nwd', 'make-mips-interpreter__wwHdzwk', 'make-mips-interpreter__WUrTvVQ']",0,"[508.010753, 783.100446, 613.110449, 1153.781232, 1453.991861]","[11.209851, 128.378765, 81.096021, 71.816935, 114.94954]",0.0,False,[] +grok-code-fast-1,merge-diff-arc-agi-task,5,"['2480e1e3-7d49-4248-bd01-2e4c90947e6b', 'c40c8646-7196-4bc4-a2fc-e6f1f067b0f6', 'd66b8d7e-a5be-4a25-8167-317f2024d192', '75fb856c-4ce4-46fa-b750-a34deefde633', '2d198eab-ffa2-4c5e-acdb-dd520cfe1b59']","['merge-diff-arc-agi-task__EZMUXfo', 'merge-diff-arc-agi-task__gJLEfN5', 'merge-diff-arc-agi-task__ybYNrax', 'merge-diff-arc-agi-task__c5evLy9', 'merge-diff-arc-agi-task__ZSmVnqf']",4,"[801.21029, 282.980675, 910.407648, 845.071644, 223.598911]","[160.427972, 32.247063, 53.290013, 144.315513, 25.15241]",0.8,True,"['2480e1e3-7d49-4248-bd01-2e4c90947e6b', 'c40c8646-7196-4bc4-a2fc-e6f1f067b0f6', 
'75fb856c-4ce4-46fa-b750-a34deefde633', '2d198eab-ffa2-4c5e-acdb-dd520cfe1b59']" +grok-code-fast-1,model-extraction-relu-logits,5,"['d31531be-74a4-41fe-8d73-2d6d2065482c', '58a2576f-8aa4-4715-b8cd-4d83f86390aa', '092edccd-2bd3-4795-9f3b-33370ee33590', '9bd3fbac-ab22-40f5-8afc-def6c2749c08', '60a2ba2a-a896-44a3-ae5c-297d8c437384']","['model-extraction-relu-logits__um5Q3Ef', 'model-extraction-relu-logits__MQbe7a5', 'model-extraction-relu-logits__MvKbEGo', 'model-extraction-relu-logits__32zbfFo', 'model-extraction-relu-logits__cjyARw7']",0,"[151.89274, 86.930158, 79.757427, 174.07949, 89.033644]","[98.507522, 25.215929, 37.881344, 57.551458, 15.639714]",0.0,False,[] +grok-code-fast-1,mteb-leaderboard,5,"['582dab3e-c249-4c08-9d3c-bfbf064a057c', '029e4ac6-be71-436e-b58b-681bec0d33f1', 'ce6b390c-9cb0-43e2-a581-b7cd2f8ef136', 'c4ff7377-67a7-4fb4-b2c9-5710a2048d31', '9c414b15-610b-41f7-bc57-909a6025a9eb']","['mteb-leaderboard__S5eUe5g', 'mteb-leaderboard__TQVqCe3', 'mteb-leaderboard__YiEixqB', 'mteb-leaderboard__SB3hpwd', 'mteb-leaderboard__Dmi6NaE']",0,"[146.267777, 54.017572, 334.936862, 368.17852, 89.786656]","[32.577891, 2.79326, 4.332947, 10.908966, 52.704828]",0.0,False,[] +grok-code-fast-1,mteb-retrieve,5,"['b15502e6-690f-4df9-8953-ab33fa8268ca', 'a02f0adf-75cb-4835-9ebe-6ca02233115a', 'c8c4f4fd-d5d2-4a2f-bd20-4dd7fe3c1969', '802f94ac-5233-475f-af91-e7ca67833fd4', '979d7f90-e29a-4f5f-ae4f-4388beb6dcad']","['mteb-retrieve__Hg3bVTM', 'mteb-retrieve__cGndWAk', 'mteb-retrieve__GiRCTFJ', 'mteb-retrieve__HnUKmWc', 'mteb-retrieve__35eQy5A']",0,"[210.914319, 217.240875, 139.967001, 80.889906, 52.264941]","[11.973209, 75.617327, 125.46929, 36.444527, 5.659716]",0.0,False,[] +grok-code-fast-1,nginx-request-logging,5,"['d8520981-e0c1-43c5-9d82-cd2d002215b5', '3e08f3b9-29d6-4997-bdd6-d714f8637602', '24472457-f34e-4074-aa41-aa33fd178913', '394497fa-7998-425e-ba88-32f7cae9bafc', '539e5175-7ae0-4359-b135-698e97ce318b']","['nginx-request-logging__ADx6sKY', 
'nginx-request-logging__38QcyAD', 'nginx-request-logging__Ft9eR5f', 'nginx-request-logging__hcNQ5QH', 'nginx-request-logging__JTzDyAK']",0,"[78.433008, 78.482906, 135.602007, 349.288517, 195.755936]","[33.784945, 56.24269, 33.581425, 37.610568, 155.836368]",0.0,False,[] +grok-code-fast-1,openssl-selfsigned-cert,5,"['35c29313-afc7-4511-abe8-13b9c9177d42', 'e455b5b4-27c3-454a-8206-c014fe952981', '60fe1148-64b9-482d-ba72-28b100ebf8ea', '32e2e69d-dc92-4a8b-9a81-a4c0b704b038', '840db8a2-7621-4e12-937e-e4955c0d5a59']","['openssl-selfsigned-cert__pQH6oRN', 'openssl-selfsigned-cert__s8aMnou', 'openssl-selfsigned-cert__bwYigmV', 'openssl-selfsigned-cert__Ht74iSF', 'openssl-selfsigned-cert__7cFPebL']",1,"[71.394297, 31.139507, 82.783771, 42.709974, 259.329827]","[53.053476, 27.0038, 70.168426, 46.940504, 47.773657]",0.2,False,['840db8a2-7621-4e12-937e-e4955c0d5a59'] +grok-code-fast-1,password-recovery,5,"['a081fdee-435a-4ded-860c-52600dee3e96', '79b54340-e4c9-474d-ac59-d3058685795c', '96a1eea1-5dbb-4812-88d3-ad61d306e395', '5a8c6cab-5d2b-4a51-9459-61dc03cd3c1f', '6896217d-dd24-4978-a10d-38b55a37fd4f']","['password-recovery__kwwMGiS', 'password-recovery__ZyqTC4o', 'password-recovery__mBzucVN', 'password-recovery__76QX5cf', 'password-recovery__JM38hz7']",0,"[725.064546, 166.469868, 1546.922871, 393.118825, 274.347955]","[41.072304, 24.798839, 140.937181, 31.106724, 38.970658]",0.0,False,[] +grok-code-fast-1,path-tracing,5,"['7dd3ba78-b646-4866-9d33-eb328d23c223', '83ffc759-3c9a-425b-8702-d5ea5fb6e06e', 'ee448201-b409-4db9-b531-7e4362d0bcfc', 'eb2121a9-fbec-469f-8ce0-0747a2c8bb2a', '136ae080-81a7-401e-9e66-8b9df4b662ed']","['path-tracing__R3RfvUm', 'path-tracing__FVfLLsk', 'path-tracing__CVmwzfs', 'path-tracing__WpjQGKe', 'path-tracing__GgdokGX']",0,"[353.434563, 900.052758, 468.402407, 104.654786, 864.613321]","[60.521827, 269.240398, 24.392706, 32.117459, 15.256814]",0.0,False,[] +grok-code-fast-1,path-tracing-reverse,5,"['e2cc6cfd-8a05-4d21-9a29-6101193986cb', 
'1ab319e5-6efb-4e51-8a4a-b6322ed9e0ed', '6bade9a9-4f4d-4a4c-9f47-b3ac7e6a0601', '662b1d6c-0152-4e79-825b-7abfc4602495', '0da7b865-1d9c-4053-b255-4dd77faa2e1c']","['path-tracing-reverse__JRmxAjE', 'path-tracing-reverse__HMmx24w', 'path-tracing-reverse__k5aKe2E', 'path-tracing-reverse__s8hFhZT', 'path-tracing-reverse__azjPixm']",0,"[778.868283, 317.714265, 855.003376, 187.353112, 210.562781]","[69.254919, 55.157044, 37.436767, 81.741657, 58.631387]",0.0,False,[] +grok-code-fast-1,polyglot-c-py,5,"['b9edcdc2-de44-4cfd-9c9f-f591c72ab802', 'f8ba3417-ba0e-4b06-8874-24f5f2e04043', '26610c59-e092-4e30-8263-2d73408b077c', '0f3bb954-0af3-4922-9dc1-be22bedeb80f', '4cda2590-856b-47f4-a88e-1709f0041087']","['polyglot-c-py__Dud6jbP', 'polyglot-c-py__gR4GEdP', 'polyglot-c-py__2nGhSwq', 'polyglot-c-py__nReBwUp', 'polyglot-c-py__b3XBzG8']",0,"[428.017157, 80.655392, 900.001487, 902.576206, 156.504425]","[22.782548, 17.220867, 42.306265, 33.091535, 32.069459]",0.0,False,[] +grok-code-fast-1,polyglot-rust-c,5,"['1a575449-6f93-48c1-873e-235602f611d3', '062ca169-0225-4aef-9012-6eeeac6c0327', 'cd462294-8aa2-4141-9b82-2b07a1034ed0', '8e1c3119-8c53-4383-a134-0eed538f5368', '19613bb6-a28e-40d7-bfdf-d90252c276bc']","['polyglot-rust-c__FkJoekS', 'polyglot-rust-c__V8FJoGP', 'polyglot-rust-c__3iRYz4y', 'polyglot-rust-c__6UuRJsK', 'polyglot-rust-c__2Ad5qPi']",0,"[143.00186, 134.266409, 276.300903, 60.939518, 134.311927]","[12.201226, 69.087899, 95.752038, 89.225538, 68.489134]",0.0,False,[] +grok-code-fast-1,port-compressor,5,"['2494010e-6cf2-4388-87b8-5a164f6fa909', 'b1100d68-0e07-496b-9cdb-615c581a86e5', 'ece02cc6-a3c5-4969-a7d3-b85ffc7f7368', '283d25bc-2e79-4301-840e-698575cec4e6', '57c092f6-9f79-45c6-a4a0-caa7c8e4657c']","['port-compressor__MQCdgdT', 'port-compressor__RkSAC8A', 'port-compressor__BVnRqmH', 'port-compressor__os3RZbi', 'port-compressor__5tG72EF']",0,"[3600.001048, 1578.648033, 1316.031081, 1162.637823, 1707.588556]","[97.684289, 105.25655, 19.012168, 36.285625, 
142.310989]",0.0,False,[] +grok-code-fast-1,prove-plus-comm,5,"['e59958ca-45a7-49c9-aae9-400727717c94', 'f1ab02d9-2e8f-4016-9adb-a0aa62fe91f5', 'b14de3d6-fff4-4d05-a26f-e81a3eb314b4', '0fb02eae-38a9-4240-8a87-a5e4280652c5', 'd1e0c755-7e0b-4d11-85fc-37ea68f7fb90']","['prove-plus-comm__rStLf56', 'prove-plus-comm__ta8FryR', 'prove-plus-comm__kdc9yko', 'prove-plus-comm__jmRgFVg', 'prove-plus-comm__HfdM38n']",2,"[120.692465, 871.183531, 93.848716, 179.639355, 223.013114]","[46.770471, 26.018969, 42.003955, 86.931802, 134.079652]",0.4,False,"['b14de3d6-fff4-4d05-a26f-e81a3eb314b4', 'd1e0c755-7e0b-4d11-85fc-37ea68f7fb90']" +grok-code-fast-1,pypi-server,5,"['6ffea995-64ee-40bf-acfe-eef9119779a7', '7f85acbc-0f96-41c0-bbd7-1c79c3bdef0e', '9ecda2b6-6eb7-4bf9-a9d8-a6a96685873d', '43db5e39-7beb-404e-ad93-1ceda10aa853', '63248a7f-4a6c-4896-a9e5-7a7478ad32a9']","['pypi-server__xHaA4s8', 'pypi-server__h2boM2W', 'pypi-server__M7XmVZA', 'pypi-server__kWb8CVj', 'pypi-server__NmV84sb']",4,"[164.824983, 358.658308, 220.468185, 99.855592, 118.283497]","[36.256824, 101.3869, 48.472387, 117.31453, 14.320815]",0.8,True,"['6ffea995-64ee-40bf-acfe-eef9119779a7', '7f85acbc-0f96-41c0-bbd7-1c79c3bdef0e', '9ecda2b6-6eb7-4bf9-a9d8-a6a96685873d', '63248a7f-4a6c-4896-a9e5-7a7478ad32a9']" +grok-code-fast-1,pytorch-model-cli,5,"['6e41832a-5685-48bb-abaf-6c677ff659a6', 'a71688f3-d6ed-45dd-a6ac-e7d58162c60b', '1d6e26a9-bf0f-413d-ab38-9145a37eb8a8', 'acac0e33-8058-4f0e-8df6-8d3a509615cb', 'dac5886f-b7af-45b5-add6-b14513335287']","['pytorch-model-cli__oYptmN7', 'pytorch-model-cli__qHerKsZ', 'pytorch-model-cli__d4jQUDh', 'pytorch-model-cli__L96SLGq', 'pytorch-model-cli__2hrb8tj']",0,"[195.916782, 255.958622, 158.553553, 751.040226, 41.815983]","[83.184178, 142.35297, 85.360047, 72.756542, 95.539356]",0.0,False,[] +grok-code-fast-1,pytorch-model-recovery,5,"['5f47255a-e9ee-4db6-aced-a38e5ed437f6', 'd9153ded-2d0e-4aee-9922-933e6d6a59df', '5a72c8fa-0b3d-49ea-a9e3-945ac438d359', 
'e95c6568-e2af-4706-af63-cf3299e21537', '71a69a77-ee48-4a65-b36b-4eeecf36c854']","['pytorch-model-recovery__BbRT9QX', 'pytorch-model-recovery__LATuwEk', 'pytorch-model-recovery__x9Zdc8z', 'pytorch-model-recovery__Ptg7DfN', 'pytorch-model-recovery__vEwEyvP']",4,"[388.586555, 165.028589, 751.082771, 210.826855, 907.022388]","[106.89135, 13.397015, 127.342524, 70.426528, 83.280276]",0.8,True,"['5f47255a-e9ee-4db6-aced-a38e5ed437f6', 'd9153ded-2d0e-4aee-9922-933e6d6a59df', '5a72c8fa-0b3d-49ea-a9e3-945ac438d359', 'e95c6568-e2af-4706-af63-cf3299e21537']" +grok-code-fast-1,qemu-alpine-ssh,5,"['346b266b-605c-4111-9355-09cb07bcb186', '498db6da-5bf1-43c2-9e3c-dad13471a78b', '13f6237b-93f8-40d3-a761-a1a272cc7eb2', '7ae7750e-4596-4b03-991b-a81632e6236f', 'b4ccc014-d359-43a0-bcfb-87db022f74d2']","['qemu-alpine-ssh__v4GJqdK', 'qemu-alpine-ssh__u8i2NtJ', 'qemu-alpine-ssh__rxHyTrJ', 'qemu-alpine-ssh__ScRQhGZ', 'qemu-alpine-ssh__GofMgPu']",0,"[169.544178, 126.480546, 438.084797, 613.068757, 224.318987]","[10.354197, 4.915091, 17.978124, 10.094561, 77.538749]",0.0,False,[] +grok-code-fast-1,qemu-startup,5,"['243c8c84-4993-4366-bc85-2760a725db0b', '342a6d2b-e1d9-429a-adf3-5c1287115a2c', '35888e4c-8afd-4d05-b235-7304a4b4ccce', 'baaec447-920a-48d3-8def-6d7e74554e17', '25041241-7c70-4d3b-88df-9a4fd0b2f253']","['qemu-startup__qn5mAoR', 'qemu-startup__PL4PuGv', 'qemu-startup__VzbLuTP', 'qemu-startup__GkCkBw2', 'qemu-startup__PEHZHBr']",0,"[214.288405, 134.143608, 502.770008, 77.342413, 110.70126]","[3.125929, 7.345084, 105.587193, 47.870168, 24.247513]",0.0,False,[] +grok-code-fast-1,regex-log,5,"['48faaa54-371a-4539-aa39-cbf013c15275', 'f6444afd-b425-49c9-a9b0-fa3b8ef2211c', '715fe238-1426-430a-a999-ebb63323271c', 'ef1f5c77-2c51-43d9-8967-865f54feabfb', 'a5625fff-9862-41ac-a2a3-7f0420fce703']","['regex-log__4962xam', 'regex-log__T4nXA3n', 'regex-log__n7unog9', 'regex-log__tsqiHxu', 'regex-log__VcydWAx']",0,"[78.786385, 113.024727, 53.534082, 54.823073, 72.708507]","[132.412973, 
42.891422, 154.52592, 180.47473, 251.216783]",0.0,False,[] +grok-code-fast-1,reshard-c4-data,5,"['d7f9cdc8-9a63-489b-9a66-ff574eba5cb2', '51e5b942-8cac-49cc-a3b4-de1d565c6078', 'b8c6dc20-6abe-424a-9e90-9c479900ef23', '5cf8df3c-1403-4ada-bc71-535d42b2fd24', '2d148477-4c94-433f-acc4-13465f7906f0']","['reshard-c4-data__oLQAh3Z', 'reshard-c4-data__xua5YLF', 'reshard-c4-data__PTphgPY', 'reshard-c4-data__zAHXPEf', 'reshard-c4-data__rykk7Xs']",0,"[1012.044011, 209.462943, 228.425349, 426.803332, 152.232057]","[199.325842, 101.970378, 18.459695, 112.318368, 44.333447]",0.0,False,[] +grok-code-fast-1,reverse-engineering,5,"['af7fd4f3-e0ce-41f6-a564-8d9fc25b5adf', 'fb0bcbd7-f53d-47f1-b5d1-2b3c22ec8ba6', '70a666d1-0963-4c10-a6c3-291b59275f5b', '9ddb82b5-7d3a-409a-a40a-7fa36fb80648', '810dfa21-fb91-47e0-8a7a-12bbd39d4469']","['reverse-engineering__jK7gaks', 'reverse-engineering__6dtJEz7', 'reverse-engineering__yFKtugg', 'reverse-engineering__gkcJygp', 'reverse-engineering__EXCvXVN']",0,"[1829.960162, 773.107443, 567.980075, 751.386512, 560.183296]","[81.651312, 9.500349, 44.186821, 72.161544, 28.131895]",0.0,False,[] +grok-code-fast-1,run-pdp11-code,5,"['c026bb4f-9718-431e-80f8-a2a9705c6356', '0a4ae6e3-6cce-4e26-ab2d-5287e007dc31', 'e6bca75e-550b-4a78-ad5a-9753313964bc', '413c3716-d159-4468-9946-22a68b37ec0e', '6f88e697-5e8b-4aa2-b1d6-a977771d3126']","['run-pdp11-code__SEUBYxT', 'run-pdp11-code__3N3jjtt', 'run-pdp11-code__xGY39X2', 'run-pdp11-code__RSDY3ch', 'run-pdp11-code__DXpeFNV']",0,"[289.745059, 778.566592, 168.64466, 175.930435, 210.61015]","[79.636708, 306.307621, 26.190271, 24.59088, 26.316498]",0.0,False,[] +grok-code-fast-1,sanitize-git-repo,5,"['d4a9c83e-4eca-4b21-8064-0d0bedec6413', '6664bb92-73d1-4c85-9296-9136052280df', 'f48e2d60-d9d0-404d-b7f0-3052388fac36', '47ac79e5-9e41-4f58-8750-d1c8f2502dec', '9f350085-b024-4dc9-879e-d1de26480524']","['sanitize-git-repo__acxSy88', 'sanitize-git-repo__oQskLDN', 'sanitize-git-repo__axv2mT9', 'sanitize-git-repo__rcJgMzp', 
'sanitize-git-repo__cMMWcsA']",0,"[143.342077, 233.533343, 728.772342, 93.022018, 277.016566]","[33.037833, 149.035607, 99.328056, 33.636933, 45.862659]",0.0,False,[] +grok-code-fast-1,schemelike-metacircular-eval,5,"['fd6ad47b-0939-4d6a-bbea-35fdf880f3ac', '78ef4ba7-9fd2-44ee-9005-86543b3934b4', '0ec75d07-c134-446a-bb5f-3f5c4422bce9', '85726105-f0d0-4bac-8949-7239a5c34eb2', '04359fed-7181-4358-9bc1-c287cb91ea2e']","['schemelike-metacircular-eval__SjSS6aU', 'schemelike-metacircular-eval__pRAxkte', 'schemelike-metacircular-eval__JdMuaZv', 'schemelike-metacircular-eval__JQXgUZq', 'schemelike-metacircular-eval__fNoAW3b']",0,"[1060.356559, 414.705353, 81.237479, 85.881396, 2458.884372]","[42.638463, 84.515927, 99.664492, 43.812574, 92.10386]",0.0,False,[] +grok-code-fast-1,sparql-university,5,"['cd84fb75-892a-4d65-9084-02c337b9a4e2', 'fa4d063d-1cbc-44d5-8840-fcf35d6accd9', '804f2b10-35f8-4b12-b73f-8efbb05db0be', 'b909de70-bc0e-44e2-8c7b-3cc1673d095b', 'a5bb7d2d-09d8-47ad-a00c-aca600518a72']","['sparql-university__fX7Crmg', 'sparql-university__uuD8a5j', 'sparql-university__AoXHXFs', 'sparql-university__nhp5oiU', 'sparql-university__DCUpf9p']",1,"[84.458351, 142.972353, 415.611983, 66.73889, 90.451081]","[28.367752, 27.781508, 197.733908, 35.879157, 55.308732]",0.2,False,['cd84fb75-892a-4d65-9084-02c337b9a4e2'] +grok-code-fast-1,sqlite-db-truncate,5,"['15e42ae0-356b-4c05-a50d-28cbc6ae135f', '0db97972-77d7-4a28-86e6-8e25753e54ba', 'a520c6b7-3bab-40ca-9113-e1bbef7cff5e', 'aa3d5da6-d0f9-4282-98fb-85558f318e93', '0ea95bbc-03c8-4b6f-880a-5ce18bbf2ef3']","['sqlite-db-truncate__eXMvwGf', 'sqlite-db-truncate__ZyxJSEH', 'sqlite-db-truncate__xh4ppUz', 'sqlite-db-truncate__wQtTszm', 'sqlite-db-truncate__bfWwMqp']",0,"[481.14695, 700.449719, 237.207365, 206.492458, 607.749307]","[65.48571, 14.371443, 23.665818, 57.338102, 34.468542]",0.0,False,[] +grok-code-fast-1,sqlite-with-gcov,5,"['8c798de3-08e7-4311-bb2b-40e93f54be4a', 'a84d82d0-060b-4cfc-98bb-a36b1399d47a', 
'b52b4b85-cbb6-409e-a3c6-ad272651857e', '8891155c-f9c4-4757-a04c-60be19301407', 'a4617cbf-b644-41e7-be2b-004a9c17e855']","['sqlite-with-gcov__SZeEhaU', 'sqlite-with-gcov__vNpoYTF', 'sqlite-with-gcov__CYReqWN', 'sqlite-with-gcov__H5eSA6W', 'sqlite-with-gcov__zS32SoJ']",1,"[205.526773, 159.549124, 529.545409, 190.95286, 414.154419]","[36.043147, 36.846421, 83.659679, 69.78673, 27.733161]",0.2,False,['a4617cbf-b644-41e7-be2b-004a9c17e855'] +grok-code-fast-1,torch-tensor-parallelism,5,"['55641752-0e34-44cf-8868-77b2a4ab1435', '06447302-968f-42dd-be7d-d3cbbd38f453', 'a70f0bc6-fbba-4caf-beb7-a10780391adb', 'ee4465a5-b328-43ba-bbb5-d91594eb5a21', '41c9e386-6900-4781-920c-94c2020fd902']","['torch-tensor-parallelism__YK6DPX4', 'torch-tensor-parallelism__icBZeJs', 'torch-tensor-parallelism__rBSjdGb', 'torch-tensor-parallelism__q84SCdJ', 'torch-tensor-parallelism__bk4yzNS']",0,"[53.174904, 12.953862, 48.794551, 49.039392, 66.318464]","[23.148643, 33.516358, 21.408038, 59.980978, 38.260453]",0.0,False,[] +grok-code-fast-1,train-fasttext,5,"['d67b5259-a4f2-495a-9a12-2e569af745e7', 'bcbd87dd-589f-46bd-a450-30995fb92c16', '10aaf009-27a2-4b61-9eb8-c1516b7b8bf0', 'efadf707-8168-4c10-94b3-b2a8c5125c4e', '3010fdc0-0b0a-44c3-9a14-b853a4b54786']","['train-fasttext__uLfzFCu', 'train-fasttext__AitcabQ', 'train-fasttext__CbpBocY', 'train-fasttext__iojb2oJ', 'train-fasttext__zEU6Bjx']",0,"[2912.105278, 1730.768589, 1162.404317, 2080.614079, 864.854779]","[27.403714, 19.920611, 20.62422, 34.431525, 77.129057]",0.0,False,[] +grok-code-fast-1,tune-mjcf,5,"['d1d93f71-5f04-4bae-85c4-47e76b49270e', 'c3ed7dfe-8950-4c58-a920-18ea42883f59', '339fe229-79dd-4d78-9ca7-79eb2cc78b90', '1df9c3c1-be10-4ba4-825d-809d1038a77e', '42eb86df-8898-4b17-b42c-d060dec3261c']","['tune-mjcf__rw8SRto', 'tune-mjcf__yKe4aot', 'tune-mjcf__gPQTq2F', 'tune-mjcf__tpBdoXs', 'tune-mjcf__QSPc9Fi']",2,"[946.07418, 333.922923, 868.599159, 548.133842, 707.711044]","[14.878575, 24.633832, 10.498409, 15.110994, 
27.677861]",0.4,False,"['c3ed7dfe-8950-4c58-a920-18ea42883f59', '42eb86df-8898-4b17-b42c-d060dec3261c']" +grok-code-fast-1,video-processing,5,"['301a20c7-1438-4568-ba66-aff2c1f19fac', '2b8be2b8-79df-47d3-a1b5-785db0a385a4', '4fb4b340-ef1f-4cf7-bdab-e81ae765a07f', '1441e536-a7ae-4ecc-8615-151b96d24b7f', '8eac36a4-c736-436e-b72e-730f6cbc55fe']","['video-processing__AXpmbc3', 'video-processing__DrhBM7N', 'video-processing__KFwwTzT', 'video-processing__vziBMzn', 'video-processing__XRt2Zc9']",0,"[84.751585, 52.054254, 152.243322, 182.58662, 91.194466]","[160.030358, 25.919511, 60.050912, 20.924059, 43.486887]",0.0,False,[] +grok-code-fast-1,vulnerable-secret,5,"['5d6f69e5-d438-4655-96de-eb06766de45b', '814a9719-ebd2-4a59-8318-b0403b0fbf2c', '3db3e388-30cf-4a91-81d9-f335ceab06f5', '0d8e6526-542a-4c3f-937a-3643c7b2826a', 'f892657e-e2bb-41ef-83e6-cb835192931c']","['vulnerable-secret__36v6fLA', 'vulnerable-secret__F4Fcv3v', 'vulnerable-secret__HXSFADU', 'vulnerable-secret__wQtdE8H', 'vulnerable-secret__rV8kR32']",3,"[901.137682, 188.613616, 916.962339, 287.634477, 169.465279]","[10.852526, 29.50428, 16.757257, 11.122369, 13.390813]",0.6,True,"['814a9719-ebd2-4a59-8318-b0403b0fbf2c', '0d8e6526-542a-4c3f-937a-3643c7b2826a', 'f892657e-e2bb-41ef-83e6-cb835192931c']" +grok-code-fast-1,wasm-pipeline,5,"['8ae977fd-44c3-40be-bbec-1c14ebd4fc5e', '77aebeb2-e444-4750-a9aa-5d868a61dc01', '0ee9d999-cb3c-465b-8bfa-4556a81d1c5b', '22d41929-c806-4483-9e54-00b739095465', '81645c37-250d-47f5-be04-241ef8a8482e']","['wasm-pipeline__aoaVpTi', 'wasm-pipeline__kxTdVbs', 'wasm-pipeline__xt9auor', 'wasm-pipeline__tiWqQ47', 'wasm-pipeline__52K5f62']",1,"[219.877135, 595.729928, 737.068533, 223.040669, 315.804973]","[4.522562, 14.547025, 9.799616, 6.977617, 11.352987]",0.2,False,['77aebeb2-e444-4750-a9aa-5d868a61dc01'] +grok-code-fast-1,winning-avg-corewars,5,"['27434c92-02fc-44e2-bc19-28c830395c9b', 'a5b643b9-76f1-455a-855f-fa5f5f06da6c', '0467048b-359c-4fbc-b476-c0da50e7b624', 
'6cf723eb-7f40-4780-82ff-74895729a479', '7777369a-3e01-4ff5-a2b7-fd87e3795b75']","['winning-avg-corewars__XGWrLyk', 'winning-avg-corewars__zFCLvnS', 'winning-avg-corewars__3LpP3wi', 'winning-avg-corewars__eXwAbF6', 'winning-avg-corewars__N4hFgta']",0,"[107.45215, 1438.55769, 574.616095, 790.302062, 2573.111895]","[83.312613, 5.132025, 37.219414, 36.489635, 15.499651]",0.0,False,[] +grok-code-fast-1,write-compressor,5,"['024712d5-2c9b-4b54-b91c-fc41bfba80ce', '5e4b6f8d-b35e-4793-9f6d-c74b37a9e9e5', '856f3eec-9478-46d7-be29-a42a2b5e8f6d', '5270ce53-3149-4a61-a036-9136d049bee3', '10f9dfac-a456-43b2-9eae-3473912232e1']","['write-compressor__GFPd934', 'write-compressor__x7Dh8S6', 'write-compressor__cpDWJGw', 'write-compressor__G5DgSoE', 'write-compressor__79nSnaD']",0,"[1445.626076, 234.927039, 206.184307, 587.516028, 739.58549]","[188.424277, 47.503429, 76.202389, 40.0098, 176.141897]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,adaptive-rejection-sampler,5,"['7a3f7aa6-f66f-4cab-be1b-efa3b39425cb', '5eb80d76-1da9-499e-bba9-8c4418cbdac5', 'a6ffc56f-5d72-4555-a5a7-8d81dba526a4', '297ee20b-9af8-4c32-ba1c-277a4e76b271', 'a77fd5b8-34f9-4c5c-a566-ab006916f2fc']","['adaptive-rejection-sampler__jH9pcBD', 'adaptive-rejection-sampler__e8vma8p', 'adaptive-rejection-sampler__fjTF6XQ', 'adaptive-rejection-sampler__6RQYmAn', 'adaptive-rejection-sampler__U8XAvay']",0,"[443.831953, 452.566367, 98.180834, 900.032628, 910.351965]","[134.861654, 143.942639, 18.142791, 85.689399, 59.490346]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,bn-fit-modify,5,"['609bf8bc-f2f9-41d8-8618-40232ace33a2', 'c401a030-7ffd-4c07-a2b3-d7bc3e35ff5a', 'f1f5dcc5-d51f-4329-a76f-96a55c9e3015', 'e0ebe836-12cd-480e-afe6-70cac4e65ad7', '6d77b365-7e63-4b88-97e1-20d615634800']","['bn-fit-modify__5LLg5dS', 'bn-fit-modify__MEXnWSr', 'bn-fit-modify__iVg7bP9', 'bn-fit-modify__gCsenTG', 'bn-fit-modify__rxCHZFD']",0,"[1356.639144, 1059.54132, 3600.457142, 1436.95288, 
1223.847915]","[20.548371, 200.656039, 14.926703, 101.760857, 61.938678]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,break-filter-js-from-html,5,"['5f8f119c-e667-4b12-84ca-2c15188bddd0', '94371db0-b28b-4a7a-83b1-cfb47a74370b', 'c1f3506c-df21-44ee-bf83-b74b63d60fcf', 'f9a8cd6e-4148-4c01-8899-25228c284cba', '142df19c-8a95-4738-8be5-c698ac9d911a']","['break-filter-js-from-html__3Rmy2mT', 'break-filter-js-from-html__aLLB4pK', 'break-filter-js-from-html__gUodtRQ', 'break-filter-js-from-html__o8vu6gk', 'break-filter-js-from-html__y3gH7ca']",0,"[337.005894, 270.436057, 509.872238, 197.006478, 278.788817]","[17.74309, 37.66168, 116.956647, 43.954685, 46.520512]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-cython-ext,5,"['2a24d1d9-fb85-4f44-a37a-12d2a790692b', '390be1f7-92b8-4ab0-80ab-550db4ffdc95', 'f3c34cdd-6d9f-4117-b0f3-f15ac9b65381', 'b9ba8ec3-16f3-4aba-b771-f0c5ac5b894c', '68de687c-2d48-4eef-8a95-c8fab032bafc']","['build-cython-ext__bvkTATJ', 'build-cython-ext__j3z24Hz', 'build-cython-ext__m3na3a4', 'build-cython-ext__hHSbAvv', 'build-cython-ext__iWGbUFg']",0,"[323.427828, 528.82896, 913.907689, 593.283873, 911.856535]","[31.650059, 66.347093, 33.17068, 134.886917, 69.623117]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-initramfs-qemu,5,"['345e0b57-6323-4dcb-9584-e12f9630348a', '84240b1c-ddc2-4252-a0ce-1f6ddb238e5c', '255fb8f0-e178-47af-8b10-220b12f925d3', '584e6f6a-7f25-4bcc-976a-2b6d4f1baeb3', '4630bdcf-0d0e-49f2-9e6a-4f89ec7959e6']","['build-initramfs-qemu__BqhbpWH', 'build-initramfs-qemu__PN9NRsS', 'build-initramfs-qemu__KdpRXtW', 'build-initramfs-qemu__ZNmK4e2', 'build-initramfs-qemu__WUbiinM']",0,"[907.695081, 91.746305, 59.102325, 552.90485, 226.543982]","[56.318789, 38.129125, 40.24809, 25.070575, 69.349172]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-pmars,5,"['15f6e573-c7d8-48b9-be03-3c4ad4de283f', '030828da-6675-4d8d-8d91-cef45fcda67e', 
'531df2f4-5755-46a2-9812-43bdd2f19fec', '2bc50ca6-a16a-4228-96e3-72dd4e94cd93', '1b46938a-eb1c-42da-83f1-cbc58b211bce']","['build-pmars__9Pkphbh', 'build-pmars__nMkMUhd', 'build-pmars__XpRoA2X', 'build-pmars__Nvhz4Pp', 'build-pmars__2aXwyNb']",1,"[929.442623, 489.769214, 501.241387, 305.964842, 352.270347]","[48.618973, 11.128041, 3.83728, 9.909446, 2.15345]",0.2,False,['531df2f4-5755-46a2-9812-43bdd2f19fec'] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-pov-ray,5,"['3100b553-e2f6-479c-9fcd-43164b4b5382', '23e2626c-010b-43ca-b41a-105e2e9743ff', '6a84c62e-9b51-471b-800c-aabca5c0e2e4', '3813e183-9d73-45ce-b6d7-5a788973cb85', '01d61d98-bce0-42cd-b01f-43b334645d7d']","['build-pov-ray__btEGG24', 'build-pov-ray__p9iGpbT', 'build-pov-ray__Gt23XbX', 'build-pov-ray__cMwVtWV', 'build-pov-ray__GbqNqbi']",0,"[508.419533, 4317.453263, 388.846578, 1781.657345, 3782.790563]","[59.953841, 50.432316, 15.959477, 76.344198, 69.724979]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,cancel-async-tasks,5,"['6267cf5f-7f9a-4f2c-b56c-e743cb848131', 'c904789f-a043-4520-8b36-86174e51a350', '91a20918-7096-4cd0-9d89-6445f31713a8', '3dd95f6a-88a9-41c9-a147-23a38b77569b', '49b9ab9d-3d94-465a-a132-6e4c59abf7f7']","['cancel-async-tasks__TDRgQpW', 'cancel-async-tasks__aZErjT2', 'cancel-async-tasks__jgGzzAX', 'cancel-async-tasks__EMqjfCE', 'cancel-async-tasks__mAeh6ug']",4,"[70.058497, 101.834606, 68.728694, 178.634469, 101.953262]","[63.861432, 25.266753, 78.122359, 91.349653, 161.094694]",0.8,True,"['6267cf5f-7f9a-4f2c-b56c-e743cb848131', 'c904789f-a043-4520-8b36-86174e51a350', '3dd95f6a-88a9-41c9-a147-23a38b77569b', '49b9ab9d-3d94-465a-a132-6e4c59abf7f7']" +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,chess-best-move,5,"['7839b505-869d-4b41-a79b-30c0a67b9998', '548fad12-326a-47c7-ac45-7f15c1f847a4', 'fea40e70-1131-4734-8163-f6de6762c5fb', 'cc10ca74-b490-46f8-aad8-3b3ee7bc84bd', '376a72cc-6c09-47c9-a9ec-e8317ea6b493']","['chess-best-move__ij9Revz', 
'chess-best-move__Hwy6xS6', 'chess-best-move__djCqvgY', 'chess-best-move__GoxMaDt', 'chess-best-move__CNRFKSp']",0,"[331.307165, 348.819779, 348.395831, 179.982553, 205.094775]","[100.152222, 48.059392, 56.252049, 23.930327, 10.155244]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,circuit-fibsqrt,5,"['16c938ab-cddf-4574-a03e-22dfa1e6f20a', 'e05f3bd0-827f-471b-80fa-6933f5160061', '9b6acff1-3b66-4167-a07c-7ecfd3ad2819', '070a75ab-bf12-4028-9cee-7a0533583ecc', 'fdefef4c-9e51-480e-82d9-33cdf28d806b']","['circuit-fibsqrt__F7uYJ4B', 'circuit-fibsqrt__UkWZRkL', 'circuit-fibsqrt__s9uJHUD', 'circuit-fibsqrt__yjNMjvu', 'circuit-fibsqrt__pqZhNZM']",0,"[292.816599, 455.85337, 131.184082, 1145.888043, 3602.424125]","[78.946996, 8.059634, 23.406607, 33.539104, 125.680454]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,cobol-modernization,5,"['78302e81-3543-4e55-a824-613628e153b7', '571e0561-859a-44d1-8f66-9f99bd3c0cf3', 'fb93a8a2-b71b-41f3-a598-0828b59b9855', '8e1ba374-b005-4253-9137-67c44aa77c4f', 'a0f86313-2baf-46c9-be00-e7e031832250']","['cobol-modernization__YgCLQgS', 'cobol-modernization__YXkqNd8', 'cobol-modernization__tJBbdkF', 'cobol-modernization__c9WBHTx', 'cobol-modernization__pxuUfbW']",0,"[900.001416, 835.953787, 678.953582, 793.406251, 918.754158]","[37.271487, 52.198233, 47.787363, 53.862547, 118.214645]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,code-from-image,5,"['42d5e0be-1278-4a47-a329-7f155a2dcb62', 'b00e4c95-d8c4-4385-b8aa-724252409d4a', 'b946042c-892a-4d99-bb60-22302b1bff63', '8d88385a-b419-4c98-a348-f99dccf825cf', '9de5fd51-5c7a-4efc-8234-a953a18d7dd7']","['code-from-image__gGarmho', 'code-from-image__cAMokRx', 'code-from-image__ECiDp45', 'code-from-image__5QZTbgx', 'code-from-image__jYSdoHi']",2,"[47.011482, 185.486745, 36.479159, 173.363513, 282.879055]","[19.350345, 59.248781, 15.750334, 42.983057, 33.448939]",0.4,False,"['42d5e0be-1278-4a47-a329-7f155a2dcb62', 
'b946042c-892a-4d99-bb60-22302b1bff63']" +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,configure-git-webserver,5,"['ed4880a9-6368-49f7-a946-3844e2cffcb4', '15d9a81e-836e-49a9-ad13-08b3474f03be', 'c35af1fe-f108-44d3-9c07-c30d9bfd3fb2', 'fd489c11-113e-4ee8-8d43-c1f7cdb44481', '7c7d3303-e31f-46bf-8fe6-a7831ee0e973']","['configure-git-webserver__ezkmXEQ', 'configure-git-webserver__ZSvsmHQ', 'configure-git-webserver__3dnFEBk', 'configure-git-webserver__SRznZur', 'configure-git-webserver__YAvQLwA']",3,"[811.789377, 249.225807, 712.381094, 434.918866, 217.175653]","[50.333593, 151.720918, 157.500741, 112.674919, 58.98747]",0.6,True,"['15d9a81e-836e-49a9-ad13-08b3474f03be', 'c35af1fe-f108-44d3-9c07-c30d9bfd3fb2', 'fd489c11-113e-4ee8-8d43-c1f7cdb44481']" +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,constraints-scheduling,5,"['88992378-e256-42d9-9358-2d0596158f62', '4175eb1f-77b0-446d-900b-20e108dbe947', '7bbaed4d-4304-4192-b938-ce14edca0610', '2edd6578-4c27-4cb1-bd17-d334a821eeaf', '9f81c2a8-afe9-4a34-94f3-156edd20e0c8']","['constraints-scheduling__XGZcADp', 'constraints-scheduling__Vb46Xw8', 'constraints-scheduling__kSnHX4w', 'constraints-scheduling__68rpgvM', 'constraints-scheduling__RQWfWnW']",0,"[391.482547, 769.9245, 118.687236, 163.750145, 461.740362]","[131.084041, 49.359468, 24.355968, 37.082756, 146.404343]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,count-dataset-tokens,5,"['62e34087-ec30-47b3-a681-485b37ba4a35', 'b8db87c7-883d-407f-8e47-442a9d4d9ab3', 'ad45fd05-7098-434d-8dea-e086a8e9c296', '5189fbf9-0111-4150-a0f1-9fd78ab8d132', '126dcbb7-324d-4173-9e3c-26705b83baaa']","['count-dataset-tokens__mtEaLbc', 'count-dataset-tokens__5Sfiqbp', 'count-dataset-tokens__U7mqR8W', 'count-dataset-tokens__4uEBtk3', 'count-dataset-tokens__oR5g2gm']",0,"[180.450189, 920.348228, 974.345603, 647.452753, 177.997661]","[35.830412, 138.631273, 44.163978, 100.537829, 39.653334]",0.0,False,[] 
+meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,crack-7z-hash,5,"['3e1915da-6f56-4c1c-8599-75bc064649bb', '7c9da7dc-7917-4261-befd-caebb15cd116', '65b3bfb9-c51d-47e5-beff-20be74796049', 'e075ac72-b6d5-4535-aae3-030b145348a4', '4395387f-8a44-4a67-b87c-42431ef0d2ec']","['crack-7z-hash__JDBceeV', 'crack-7z-hash__6ABrQxn', 'crack-7z-hash__K6rCcLw', 'crack-7z-hash__Gt4H3fm', 'crack-7z-hash__o9LCmHz']",0,"[315.384396, 68.802228, 109.678749, 184.537121, 104.553058]","[22.233589, 11.3947, 31.18264, 28.873401, 23.056569]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,db-wal-recovery,5,"['2674f06e-ffdf-4000-99d0-9e9e16f77d94', '5331c57d-b7e2-4004-9bba-8a01fded8bf2', 'afb60f89-d9f6-4894-b6b5-9f35ba9ac2d2', 'b6ed6150-7d59-401d-9c59-d2d400d23ab2', '593b8ae4-9f1b-4e34-8253-0976e2f6db97']","['db-wal-recovery__Djc5W9s', 'db-wal-recovery__qTJ3Sw3', 'db-wal-recovery__gHfoCCv', 'db-wal-recovery__7tn64Nh', 'db-wal-recovery__CzmRHmV']",0,"[245.734725, 152.173643, 42.300927, 414.862851, 62.129188]","[59.665262, 29.978612, 12.624546, 59.744929, 15.905362]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,distribution-search,5,"['4b55825a-b820-4484-99fb-4cf6faa06238', 'f8e30418-bb33-495b-a1e3-a44906c15318', '3be4d6fa-1851-4b67-ae8f-2f5fdd5b496e', '90e9c501-2db6-4538-9815-97fe7b2ce0ab', '54e713a9-949a-47c7-945f-db4b6d2d2fef']","['distribution-search__vwabr8w', 'distribution-search__Q2HzxvR', 'distribution-search__p4H9kDw', 'distribution-search__ykjzaq2', 'distribution-search__XVAiiJK']",0,"[243.073717, 3600.129881, 2071.035792, 305.537301, 432.03825]","[16.414894, 176.650985, 61.805911, 58.021264, 22.804292]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,dna-assembly,5,"['1766329d-0965-4567-931c-021b7ff46521', '7bda02fa-0aea-48c7-8d34-9785892edeaf', '9f2e71fc-04ce-4def-bcd6-760a6e8383f8', 'b61330e2-0a01-4691-8ddf-658e856ae3b5', '242354a3-1c59-42ee-a383-74088c08c2b3']","['dna-assembly__wmQBNWE', 'dna-assembly__CFxzAaQ', 
'dna-assembly__BjRDtH6', 'dna-assembly__rWoyuuW', 'dna-assembly__PtraXmJ']",0,"[508.706495, 279.236747, 334.24445, 733.008006, 119.754246]","[44.140535, 59.81763, 35.48872, 51.721893, 41.178541]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,dna-insert,5,"['d4dde4c0-53e0-475a-86b2-d0c815c56884', 'bbd9c1fc-ec46-4167-a537-7462c28bc918', '22e75e91-a347-4cbd-ac29-4f080beca403', 'f6b71d70-b7c6-4606-9b5a-48a07c0f8635', '9ae134e3-a91f-440b-aa91-0d0561414b56']","['dna-insert__WCqWFo4', 'dna-insert__hi7jBWB', 'dna-insert__BUgXuAe', 'dna-insert__WWq4QJM', 'dna-insert__BxQCgbv']",0,"[360.416892, 203.638627, 378.54079, 554.977483, 360.018043]","[267.18661, 17.22747, 14.4986, 30.041314, 22.29442]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,extract-elf,5,"['48139ece-b8f9-43c0-b830-ff8cd34ac5ab', '650e0956-5a92-4842-a328-db3dd871c31c', '6e87e728-0f70-4f4e-88ef-4f417b654a90', '97f8c84c-cef9-46e9-9ddb-95d815169c38', '3f08affe-15f6-4532-85f2-52ce6e853c29']","['extract-elf__9Ej2off', 'extract-elf__xoe25rQ', 'extract-elf__kcot7kQ', 'extract-elf__7SRvkas', 'extract-elf__WpVTGeR']",0,"[297.559173, 175.25702, 274.899049, 242.698079, 150.776812]","[59.006526, 38.169306, 161.932565, 29.204032, 17.998567]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,feal-differential-cryptanalysis,5,"['053c9289-db62-4e76-830f-ac9ddcfef8f5', '77a38917-d85a-4853-8fbd-c0af307184d5', '8f587f5d-0801-4f97-b4f9-19f5b112e74e', 'd1c3109b-e239-448e-8137-211b014cb004', '5476fd2a-cbac-4616-8dad-538df3dad114']","['feal-differential-cryptanalysis__77Tvvgn', 'feal-differential-cryptanalysis__XG4BASk', 'feal-differential-cryptanalysis__A4rWo27', 'feal-differential-cryptanalysis__Fjpz6a8', 'feal-differential-cryptanalysis__ixhaTwm']",0,"[208.933573, 231.038091, 303.201246, 965.669238, 117.847508]","[74.446387, 94.684218, 187.91086, 208.949172, 23.503721]",0.0,False,[] 
+meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,feal-linear-cryptanalysis,5,"['52d812e1-f65d-4f7d-9439-fccec6a7872b', '2526fb6a-159a-4109-9b29-394ab7adbed5', '0ef2c5d7-e28b-4c55-8649-5935e00e81d8', '261eac40-4ac0-4533-8a6c-1ace515affeb', '0473ee54-0c86-4581-8902-a4fb39b92a88']","['feal-linear-cryptanalysis__FvYPDfE', 'feal-linear-cryptanalysis__JEPrspb', 'feal-linear-cryptanalysis__mzdjE8T', 'feal-linear-cryptanalysis__ao35cBT', 'feal-linear-cryptanalysis__GL5Ugqw']",0,"[659.535679, 647.888643, 308.497992, 748.764668, 167.917433]","[39.835824, 16.53196, 159.932211, 42.346475, 20.539694]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,filter-js-from-html,5,"['aee19d22-795e-466b-add5-664de2494788', 'f912fa47-df61-49c9-a31c-a11b2afce051', 'b64c92c0-0961-4d3a-b574-b86bb1274980', '6bd0cc3b-f75f-41c9-b56f-f0253e395c8a', '46d89796-e6d7-415e-b8d0-5f3f3d938aaf']","['filter-js-from-html__58rSadF', 'filter-js-from-html__ZuTWmPR', 'filter-js-from-html__M6zB9Hu', 'filter-js-from-html__77GCtMk', 'filter-js-from-html__9edc2yw']",0,"[21.252784, 67.69575, 118.673897, 81.386927, 611.113985]","[20.583037, 21.409449, 22.129982, 24.884424, 41.494858]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,financial-document-processor,5,"['f649f426-bf84-41c8-a076-130782763dfc', '781c84a8-c6da-41b7-9e61-50c700a288ba', '4a120157-5af1-4313-9897-288c67b8d002', 'f0d343fb-6ea9-4a4a-a397-21ae4bfdc84c', '1b61a5c5-37e0-4ade-b668-98b94419791d']","['financial-document-processor__6gmJ5Tw', 'financial-document-processor__aA5cfpH', 'financial-document-processor__27ZBYVE', 'financial-document-processor__jyhcCm3', 'financial-document-processor__D6rzKe9']",0,"[86.600112, 890.061216, 641.888099, 87.426206, 255.456439]","[254.113719, 20.656735, 78.744489, 105.546605, 48.413655]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,fix-code-vulnerability,5,"['2fba23b9-6920-41e2-ba80-5baae420cd47', '6589165f-d71c-41ff-b139-ea158ac4eb47', 
'd758d4fb-cbcf-4979-912e-978e826107a7', '7e4071e9-b597-48a8-bab7-d761c0744c30', '2d16700d-01c1-4eb9-b6fe-72fd28afbef0']","['fix-code-vulnerability__ZUThhxy', 'fix-code-vulnerability__a8eHcMc', 'fix-code-vulnerability__ijuTdU7', 'fix-code-vulnerability__aNQJ5mi', 'fix-code-vulnerability__A2E3bse']",0,"[900.055103, 900.882931, 982.605331, 1062.355889, 909.955602]","[11.484988, 5.351041, 38.779384, 5.926621, 8.221681]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,fix-git,5,"['268e8eec-16aa-4301-be7e-3a7ef529fc80', '65d04922-ca6d-482c-a6eb-9763f0936706', '7c278c4a-89d3-4b06-a594-1a7903cd80f8', '37c8c9d8-62ba-4b65-8f8e-c69688f862b2', '6140b0e4-d434-46ba-951c-06e778d13652']","['fix-git__ydn85yA', 'fix-git__UYHP5jo', 'fix-git__Eub7N7a', 'fix-git__gvosvod', 'fix-git__DNE5KgW']",0,"[551.904755, 900.035437, 73.546742, 101.84988, 140.804019]","[33.310676, 61.062588, 24.070601, 13.816383, 53.131651]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,fix-ocaml-gc,5,"['6fd820be-b25e-4425-9c6e-5c63969c1065', '72dec8b9-abef-4db2-9120-ccd6b100adad', 'b7dfa100-d590-4f89-930e-60354663b18b', 'f1657e05-45a0-4369-a05d-10b4c50dcdb3', 'fb47150a-2a37-4c06-b30e-45bfd46fb26a']","['fix-ocaml-gc__Mg3QHi4', 'fix-ocaml-gc__rNonjuK', 'fix-ocaml-gc__vwBXUXL', 'fix-ocaml-gc__emcymhc', 'fix-ocaml-gc__vKXbG2S']",0,"[3602.848726, 3740.400352, 3602.62982, 801.922854, 1780.07684]","[82.401526, 24.04876, 36.378456, 32.899576, 39.447278]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,form-filling,5,"['98742de8-4277-4360-a635-3637adc1e4f1', '741f502d-7463-49ee-a2dd-4010804303b5', '3c3e2a01-8ab5-44ae-87ca-4ddf8e440247', 'a037118f-0681-4c65-a731-72bd3e2159ca', 'd1316069-d1c1-4d4f-93bf-27372190b9fb']","['form-filling__eSBhHw7', 'form-filling__xT7frnz', 'form-filling__joWZozU', 'form-filling__3PiqVX8', 'form-filling__SDtrV5M']",0,"[211.917987, 781.053363, 322.849715, 249.79161, 286.281921]","[14.917155, 17.870306, 3.48432, 9.381006, 70.521735]",0.0,False,[] 
+meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,git-leak-recovery,5,"['cb9c8422-c024-410c-ac0b-2be8a204cd66', 'c5382eab-2619-4eab-bcd7-a399476c9e49', '4284deef-8436-4a92-9185-205bf3cacbde', '464cd2a9-bd38-4f3a-aa3a-88d5711fe689', '945b7dc1-8899-406b-b648-4cb0c9e6337e']","['git-leak-recovery__ncTEgPG', 'git-leak-recovery__LzSxo8h', 'git-leak-recovery__MbhTjkZ', 'git-leak-recovery__BQWwWPj', 'git-leak-recovery__xzYHMxW']",5,"[93.864496, 145.433655, 116.743747, 855.601774, 193.680403]","[22.641398, 109.33106, 36.190508, 37.187662, 40.870093]",1.0,True,"['cb9c8422-c024-410c-ac0b-2be8a204cd66', 'c5382eab-2619-4eab-bcd7-a399476c9e49', '4284deef-8436-4a92-9185-205bf3cacbde', '464cd2a9-bd38-4f3a-aa3a-88d5711fe689', '945b7dc1-8899-406b-b648-4cb0c9e6337e']" +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,gpt2-codegolf,5,"['56ae61d4-faaa-4104-a6df-1b68bcd4ce7b', 'aa5398fa-5ba3-4216-9a7e-23b9d94b92b2', 'e0b75daa-1c65-4263-86ac-646d7906e36b', 'c95b07d2-7d0b-4d82-bc82-039d5c129240', 'd7511421-da50-4bbe-a619-5586b20bea5a']","['gpt2-codegolf__i4LcCen', 'gpt2-codegolf__nXuqnEG', 'gpt2-codegolf__jS57ef3', 'gpt2-codegolf__bRKpUZ3', 'gpt2-codegolf__JoG3f6K']",0,"[338.160201, 245.821412, 242.081573, 157.378371, 170.261898]","[232.16668, 127.70186, 85.983622, 19.712883, 9.296963]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,hf-model-inference,5,"['e7a28c2d-e4a6-4bba-afad-04134ea4b4e5', '55beffa3-bc8c-4001-8726-fadc1fb3b5dc', '1bcbf4b8-2e6b-4b7c-949d-6e56a4c7addb', 'b14d6774-d891-4203-a46d-71b1444df992', 'd5e5a5fe-4d0c-4a57-bc27-01c1f63e65bb']","['hf-model-inference__Hj2bZpS', 'hf-model-inference__mN5DPj4', 'hf-model-inference__dkFr5CU', 'hf-model-inference__2STQXNP', 'hf-model-inference__kx3r73f']",4,"[102.926319, 109.809239, 894.896704, 122.927531, 178.737748]","[35.659686, 28.47753, 163.947452, 26.446477, 35.260766]",0.8,True,"['e7a28c2d-e4a6-4bba-afad-04134ea4b4e5', '55beffa3-bc8c-4001-8726-fadc1fb3b5dc', '1bcbf4b8-2e6b-4b7c-949d-6e56a4c7addb', 
'b14d6774-d891-4203-a46d-71b1444df992']" +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,install-klee-minimal,5,"['6eefad9f-1b07-4d90-8b80-8a53d6f083e3', '43b89775-8f8b-473b-9225-0f8d42d1c4df', '2111477c-5a7b-4738-9125-399df8e29567', '85b875e5-39c2-4a37-8a9a-a04fc20b3404', 'bde404ca-0f41-43a6-b5ba-422c1815aa3b']","['install-klee-minimal__Yg8VucH', 'install-klee-minimal__acjmFmq', 'install-klee-minimal__jgVYWPe', 'install-klee-minimal__u3YpHMq', 'install-klee-minimal__de9KTEf']",0,"[1730.283575, 803.787656, 907.342612, 904.160487, 900.013688]","[49.164528, 38.277293, 200.493364, 113.37073, 90.302296]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,install-windows-3.11,5,"['4e9690a0-647b-4a23-8f7a-5af107c2da6e', '57f0d009-60f9-479e-8556-ab0ad4d2ed68', 'e0605fe4-17b8-4728-81bb-ceef585de0b6', '3905f39f-c343-4047-81da-e09760ba7025', 'be73d57f-9a9d-46b0-be33-d67320b4c4f7']","['install-windows-3.11__jXFk95N', 'install-windows-3.11__JWpWEXS', 'install-windows-3.11__xsPqNtJ', 'install-windows-3.11__x5betXj', 'install-windows-3.11__iyQdBsG']",0,"[199.669191, 206.796109, 385.069929, 154.505019, 145.051022]","[27.739113, 39.940761, 32.105137, 33.834671, 32.296589]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,large-scale-text-editing,5,"['03d03caf-4ee8-417b-a4bb-8517706b9f46', 'efb8c4b4-7411-4c5d-a449-d5d4f6cf1f20', '8bf231b1-040a-4d2c-b85d-f34555e38d77', '4aeedd1e-a433-4484-82d2-839b24e7c502', '19594301-ef2c-47fd-a231-2775535c8bfc']","['large-scale-text-editing__eDwNSaW', 'large-scale-text-editing__oyhGk89', 'large-scale-text-editing__7PhVCDX', 'large-scale-text-editing__bf3LGsW', 'large-scale-text-editing__XpLfm2t']",0,"[418.408032, 73.994836, 251.051767, 177.826574, 234.161902]","[215.885075, 13.905223, 137.163686, 18.464695, 65.381501]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,largest-eigenval,5,"['32bf7861-fca6-449d-a9d0-94309bc8ae1c', '1f3e5db6-b627-4ace-bd70-be90a2aa6c3d', 
'2a1ffe06-9243-4547-a979-859aa768204b', '4c40dec6-6d4b-4fd5-8552-e0ee6ad2768b', 'c07652f4-dd0c-43b6-80d7-a6ce535b2d15']","['largest-eigenval__aGoBhMT', 'largest-eigenval__rYzrMuk', 'largest-eigenval__y2Zt2zb', 'largest-eigenval__eWTMeSf', 'largest-eigenval__kpGqwCT']",0,"[435.740243, 585.776452, 299.38884, 913.220029, 907.211007]","[51.863351, 89.021691, 21.243629, 187.037358, 36.57869]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,log-summary-date-ranges,5,"['37c36cea-c799-40ba-b8d2-30f80711d9c5', '89ae7ef6-f48f-475e-845c-f25139fe011c', '29748f49-c251-4ddd-a308-cb928cc39b5e', '371272f2-e40d-41da-a6cf-a42b7a406413', '86576d8c-6f2f-4603-8c6d-093454315e86']","['log-summary-date-ranges__dTLHdjS', 'log-summary-date-ranges__aTK5335', 'log-summary-date-ranges__Z9CcFQ7', 'log-summary-date-ranges__8FGEwKL', 'log-summary-date-ranges__aKSHivz']",0,"[258.871112, 115.628928, 128.638703, 103.066969, 172.084493]","[30.136774, 16.756118, 34.04871, 43.186101, 50.664374]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,make-doom-for-mips,5,"['692df3a5-85b6-40f2-be8c-52c4deb85f96', '8bff6887-db91-45f7-993c-fe9a6b11124f', 'f0d20d55-412c-4831-b731-a405f63c9ae6', 'dc7859da-6d76-4729-8bdc-f0185ddc6c30', 'ff474af8-dabe-444d-b840-3459de901912']","['make-doom-for-mips__5b2UnMY', 'make-doom-for-mips__b7gjcKZ', 'make-doom-for-mips__PUiWFnp', 'make-doom-for-mips__uD2z45s', 'make-doom-for-mips__c75mpa6']",0,"[793.212135, 186.107043, 363.680174, 479.80599, 916.591087]","[34.935737, 160.63096, 105.494609, 42.708345, 23.10511]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,make-mips-interpreter,5,"['0629b921-5023-48da-9581-c09e07980824', '9f80c14f-16be-40a1-a6b3-8b56d668238a', '0d1996b6-6af8-447b-9518-3aa08cd94470', 'd77d25a3-d14a-49cf-9b61-1bd93315d651', '3fd577a7-20de-4eaa-9c93-63dee9019e49']","['make-mips-interpreter__SSzaUDa', 'make-mips-interpreter__2G3AH9x', 'make-mips-interpreter__ZGqJ6vY', 'make-mips-interpreter__xooqFYB', 
'make-mips-interpreter__tVMgEwE']",0,"[1839.633245, 1111.243218, 1105.655288, 1800.767036, 1808.34095]","[86.319655, 205.425788, 10.665618, 50.374821, 79.462857]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,merge-diff-arc-agi-task,5,"['fb7ce6a8-1731-4ba8-beaa-e05eeecbf57b', '4da9c447-3511-419c-993d-fef9a35dd0cd', '638fa9f7-fd43-4f40-a0a9-222a248993db', '4494f62e-961f-4455-80f3-89d9c1c9c10c', '27f34435-87e4-4aae-85a4-1b12f7a2ffe6']","['merge-diff-arc-agi-task__CQxX8Uo', 'merge-diff-arc-agi-task__m5FfFoA', 'merge-diff-arc-agi-task__2Ads36i', 'merge-diff-arc-agi-task__YPAHgBn', 'merge-diff-arc-agi-task__EV3GNVQ']",0,"[934.984083, 168.27478, 900.460495, 900.244142, 149.666435]","[44.689005, 13.790154, 19.586971, 92.506042, 65.669393]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,model-extraction-relu-logits,5,"['c47de1c0-bc5a-41b2-8119-96cef019fd54', 'afb23def-2fbe-4d50-949c-e47b1936dab8', '7759896f-4d72-4d48-84e4-eaf18d9cf937', '71b2cadd-4c07-41d1-94f4-c3c6ff789110', '7262a830-bc7f-4d42-8ed9-90bec1790942']","['model-extraction-relu-logits__NkFGyrm', 'model-extraction-relu-logits__q6cn6z8', 'model-extraction-relu-logits__u2RJLA6', 'model-extraction-relu-logits__SCPaQU4', 'model-extraction-relu-logits__4SbtPSy']",0,"[194.910346, 278.303463, 82.556417, 136.147757, 108.303099]","[206.009756, 258.534361, 20.1899, 9.38187, 51.739388]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,mteb-leaderboard,5,"['2074395e-72ba-495c-aac3-52cb348aaefb', 'b11a9242-99d6-447c-ac66-423240bb92fc', '80f3b88a-e759-4644-adf0-d694567f935a', '5448cde9-71e6-415f-8499-cfc4d2fb4870', '9a390507-2ea7-41cc-a572-200d550b6c5d']","['mteb-leaderboard__PfXbWv2', 'mteb-leaderboard__pBa56B3', 'mteb-leaderboard__QiMY6ob', 'mteb-leaderboard__BL6Fd9G', 'mteb-leaderboard__TcR8KGN']",0,"[296.550172, 281.57408, 195.191571, 168.491044, 142.146844]","[70.393663, 21.724571, 11.502529, 4.567054, 16.420916]",0.0,False,[] 
+meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,mteb-retrieve,5,"['97c0c036-f35b-43bd-ad4e-361e13d3adf3', '41f57a35-8638-4ee8-ba5e-e86de07b3275', '0fd2cc0e-19f8-4c4d-b38b-c3213054f032', 'd59d5a20-f553-4305-b7ae-09fca34aa8c8', '8b40e7e5-2617-4f21-839d-f7db09730e5f']","['mteb-retrieve__QvnJisz', 'mteb-retrieve__Ehiapx7', 'mteb-retrieve__kWqZ4wJ', 'mteb-retrieve__kxS3rsF', 'mteb-retrieve__V2PEgTm']",0,"[223.729267, 56.006153, 89.418395, 692.044962, 239.285989]","[9.96711, 86.816316, 3.259817, 111.094039, 9.733968]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,nginx-request-logging,5,"['cae55284-767b-4ebd-86ef-3e06a9b9bbd1', '446f5c8d-1333-4a32-be63-274d95b88d41', '17323233-52d7-46e3-9451-02d01b0c8eaa', 'ec628432-aab1-4922-8169-5e96720b2162', '64630eaf-d90e-4033-b7ad-7d2a0996e2c1']","['nginx-request-logging__Lvqrb8s', 'nginx-request-logging__yR95NqN', 'nginx-request-logging__wGTpQPv', 'nginx-request-logging__UhS6g8Z', 'nginx-request-logging__teEWxdm']",0,"[126.59226, 539.455068, 516.70874, 212.602059, 671.900416]","[52.348583, 38.347891, 89.095702, 34.795871, 61.439125]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,openssl-selfsigned-cert,5,"['804384d0-f540-4ce8-86db-7b9e66721dbc', 'cea91da9-81c5-46ba-a157-da8ea000859c', '5018f689-0021-4208-a8ab-6122d6ffe698', 'e494e657-f427-4915-b6c0-5afa96fa3d07', '4ef30e0f-09d2-441b-b98e-6478ec31defa']","['openssl-selfsigned-cert__8XuL3ER', 'openssl-selfsigned-cert__K8ie3DE', 'openssl-selfsigned-cert__XBkEMX8', 'openssl-selfsigned-cert__AjZokDM', 'openssl-selfsigned-cert__p7h2q8X']",0,"[122.044992, 113.553917, 252.476998, 78.41501, 44.371112]","[58.105001, 17.419775, 66.755126, 27.573196, 14.724864]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,password-recovery,5,"['2bd62ac0-fae2-40c2-8a7a-1812094ce5c5', '43e5e073-eb9c-4642-ab77-b78613892852', '069d7ca8-b547-4f96-ba27-e935985b8439', 'bdf9e342-ef02-49a6-8e19-f86caf176a0b', 
'fe13e430-f84e-4245-9e5a-8788f0b616bf']","['password-recovery__qFcmK3v', 'password-recovery__3xpwPa5', 'password-recovery__JdRxnbK', 'password-recovery__D4jNvmU', 'password-recovery__ghdMiQy']",0,"[136.873587, 187.252973, 1324.457706, 196.82905, 555.30096]","[27.132938, 51.22827, 268.000254, 35.150383, 27.580639]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,path-tracing,5,"['275e8b82-891d-46de-a580-68ca4def2ee8', 'c930e187-e83f-48c5-a4ca-b9ff889210c8', '4d195acf-28e9-434f-abbc-be91853b8e4a', 'aef94f94-62d5-4af6-b099-ee82ba5e0c03', 'e075940b-9c24-46d5-9b9c-959893b67c63']","['path-tracing__nfbe9y9', 'path-tracing__jmbVhXb', 'path-tracing__ZoP499H', 'path-tracing__cQMnBgz', 'path-tracing__zjbnnad']",0,"[273.046074, 602.096762, 357.47181, 90.968048, 450.005837]","[46.813609, 105.925436, 38.264099, 44.443192, 34.455314]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,path-tracing-reverse,5,"['174614b7-18f5-49a4-930b-09a24b899f5f', 'af25f61f-d195-4b62-a981-5f9578096df8', '4bbc06d6-d03e-4130-87fb-62b645f8230e', 'e5439a3f-7ba5-4a25-8513-891bb22a313c', '8a2a6aa6-40ae-4c52-b368-857173911a92']","['path-tracing-reverse__Wdh2TZW', 'path-tracing-reverse__oiTuayJ', 'path-tracing-reverse__bcDW5So', 'path-tracing-reverse__wNPsY4Y', 'path-tracing-reverse__eietuxT']",0,"[304.827997, 210.439191, 698.288089, 949.059229, 467.653959]","[38.154551, 18.330192, 37.140348, 64.425026, 111.531673]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,polyglot-c-py,5,"['9f4fd13d-98f2-4b1d-95e5-a5b3141c2bde', '0a83829c-c44e-4ab6-9cfa-6418dd9037be', 'fd71404b-c7e4-478f-9e7c-b27d47186994', 'd0854df0-1c07-4d90-bb05-55c256631343', '050f40b6-f8fc-4f0b-a599-8c4aced4d44a']","['polyglot-c-py__ZAMC4FV', 'polyglot-c-py__gB4nHkF', 'polyglot-c-py__tbyb8KM', 'polyglot-c-py__2jZySSy', 'polyglot-c-py__wp8JkXr']",0,"[72.777524, 757.492192, 78.489297, 117.323132, 193.214625]","[29.728931, 53.758999, 57.984568, 19.415107, 18.943557]",0.0,False,[] 
+meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,polyglot-rust-c,5,"['775a18bc-c52a-4805-88b1-c0c10191a837', '49bebc3d-28e1-48d2-8d08-f023fb44d323', 'fc51335c-0530-4216-aa91-df9e144e442f', '61fadb13-c0d8-4c67-a51e-0748db8deb9c', '1612d9f0-2390-4305-a058-641caf92a327']","['polyglot-rust-c__FjHHt3m', 'polyglot-rust-c__D8X2N6T', 'polyglot-rust-c__XbngPHS', 'polyglot-rust-c__k6wXHCB', 'polyglot-rust-c__3NXzCs7']",0,"[340.353375, 301.09723, 184.874006, 209.510837, 314.795301]","[119.770238, 58.565183, 94.538862, 179.953556, 57.892958]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,port-compressor,5,"['7f4d951a-b4c0-401d-a745-68e00ce7d4a0', '74f22536-99cd-4868-a42f-729d38d9557a', '325d2035-375b-4b45-a702-330cd8554324', 'c0311797-999a-4830-bc01-b1e54e30bc73', '49185b8e-9a4a-4426-bd1e-2797344e2377']","['port-compressor__zHQAiYr', 'port-compressor__AkYwhsa', 'port-compressor__v2wCGCL', 'port-compressor__hsEmTmo', 'port-compressor__bdoq32x']",0,"[947.739082, 3600.006561, 3613.524651, 3601.871482, 3600.001877]","[38.827806, 61.003876, 136.483815, 180.005896, 241.135165]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,prove-plus-comm,5,"['c529bee6-4438-4267-989c-ab9b5898be10', 'ecc90827-bd06-4590-b9b0-7be15348cbac', 'bc86da49-4e7d-43f8-82c2-285937f191ae', 'b2860e8f-0ee3-42b2-af10-ad425d7d089b', '818d564b-80cf-490a-8854-29094810443a']","['prove-plus-comm__yCZXAzi', 'prove-plus-comm__bxRfh58', 'prove-plus-comm__dfnnN2G', 'prove-plus-comm__L2AUzMJ', 'prove-plus-comm__VfeinTP']",0,"[277.914475, 393.231077, 43.522987, 80.412506, 235.731166]","[29.826554, 139.766221, 26.059525, 59.962465, 95.754563]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,pypi-server,5,"['a3cf9822-dbcd-4023-b781-dc16820f448a', '0f9ff584-d3a6-47c9-b8c8-865b1666693d', '9e259cdf-dbfb-47c8-9766-540e0a15b510', 'c20f0d66-09f1-40af-8f70-cb209fc32bfa', '3ac84d45-25ae-4f88-9e30-d17dd0403675']","['pypi-server__wxXp3PM', 'pypi-server__EVWs4eA', 
'pypi-server__usxRYhK', 'pypi-server__rkk377o', 'pypi-server__s7ifTyn']",1,"[558.133171, 359.145954, 718.81295, 167.781209, 128.646041]","[34.284539, 11.993968, 105.586534, 21.924235, 21.340807]",0.2,False,['c20f0d66-09f1-40af-8f70-cb209fc32bfa'] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,pytorch-model-cli,5,"['e56e2182-7af5-4dde-8cad-0c555badbfcd', 'db6da5a7-058a-4629-8e7f-fc363c46ca1d', 'e15e2e63-0492-4377-b33c-a935e1cbb7ab', 'a9186817-c1f5-46c5-b9a1-44269c5712c8', 'b06f5648-447b-4a39-9e86-6a5c4ab33b8c']","['pytorch-model-cli__FK5icKD', 'pytorch-model-cli__FyhHABB', 'pytorch-model-cli__YDGsg7t', 'pytorch-model-cli__BsUDXtf', 'pytorch-model-cli__dU77JDZ']",0,"[134.009373, 902.028783, 196.332793, 1174.397936, 160.840025]","[48.403253, 125.704254, 33.560021, 95.385623, 98.829212]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,pytorch-model-recovery,5,"['1083dc22-2909-4d28-9026-e515d6cf8efe', '61155f11-74de-4682-b4a8-60fb74609b47', 'e76868f1-86b9-47a3-9928-2c714b562908', '69974c12-9460-4e5c-976a-bcf1cdba8684', 'c8798727-9608-4677-a115-60c304852b82']","['pytorch-model-recovery__LdZAS4s', 'pytorch-model-recovery__yvLpQnw', 'pytorch-model-recovery__Ps89d4P', 'pytorch-model-recovery__rq9cPcM', 'pytorch-model-recovery__53wF9U5']",0,"[242.533156, 644.098194, 924.298777, 904.304517, 900.669141]","[68.966229, 13.845346, 48.236642, 52.884722, 30.999264]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,qemu-alpine-ssh,5,"['04ac7774-e89b-4375-951c-ec9170f30284', 'cd8e5bda-3f26-41cb-a107-1c5930e29bbc', '49e9a6df-bb66-4748-802c-90236c2b0431', '123ff3ca-2c6c-41db-a9a7-079c21ea44ac', '5572e163-9e93-4bae-936f-cf990fd45e3a']","['qemu-alpine-ssh__Cy64M9F', 'qemu-alpine-ssh__jBvVJ7h', 'qemu-alpine-ssh__rdBTjUm', 'qemu-alpine-ssh__G2ENJ4y', 'qemu-alpine-ssh__pcr6uTh']",0,"[106.73237, 293.417581, 181.289747, 127.505093, 102.067955]","[4.467792, 48.268518, 4.670382, 5.095227, 5.190613]",0.0,False,[] 
+meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,qemu-startup,5,"['56279176-9b1b-41e9-acf8-d2b77ff99f16', '4c683ab1-5dcc-47ea-af28-3d921842ce2c', 'd7b35b3c-d36e-403e-8160-f1e5d9dfc1d8', 'df93a0c1-4a8a-4783-bbde-c745ff4aec67', '6819fe3a-fbc7-45f0-8b81-63d3d6d092b6']","['qemu-startup__ipoqV5J', 'qemu-startup__jKAtLk8', 'qemu-startup__KefTKDZ', 'qemu-startup__Epxxom2', 'qemu-startup__aGpDw7M']",2,"[228.085108, 96.133406, 453.121868, 476.429801, 137.037577]","[17.706559, 6.707353, 6.417834, 10.918758, 4.117721]",0.4,False,"['d7b35b3c-d36e-403e-8160-f1e5d9dfc1d8', '6819fe3a-fbc7-45f0-8b81-63d3d6d092b6']" +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,regex-log,5,"['2e4bd1d6-0972-4a93-af96-d663469d7e56', '1254d544-f93a-4598-a42a-ced14dbcab43', '4958dae9-e076-4be4-8684-c2640a38a643', '10e4783d-31c5-4116-a557-a8fe6686f4e7', 'fe450c50-fa93-43fa-a7f6-5063274306f1']","['regex-log__SJprxaL', 'regex-log__hT7rRCS', 'regex-log__SreXGDh', 'regex-log__MkJMZEU', 'regex-log__AoXkZx4']",0,"[68.106004, 625.376828, 79.010063, 85.422594, 46.768913]","[96.064408, 158.323283, 83.812719, 61.048615, 37.974975]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,reshard-c4-data,4,"['a8df9ae6-5894-4908-ae10-20cf096a68ed', '912644b7-e32f-4db9-8b8b-b482c7609afe', 'eccf9b86-76f0-463e-9749-36dcfa9063cc', 'bf5a5972-1e5b-4999-8849-95938f9e85ff']","['reshard-c4-data__fstSFri', 'reshard-c4-data__aFpuinL', 'reshard-c4-data__MbpUXWU', 'reshard-c4-data__ZeUqDdM']",0,"[378.618312, 408.790879, 480.301997, 279.981902]","[269.603504, 45.504852, 213.777513, 98.208801]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,reverse-engineering,5,"['7aeec8db-253e-45cd-bfb6-7ec00db319cc', '235801ab-a88a-4838-8e2d-d04988be3556', 'a2556c43-39f5-42f9-b9c5-fdee28dda496', '49f7029c-e89a-4ab8-9912-20cff8f06eee', '8d45bd04-bc18-4ce0-af7f-c9c8446aaeba']","['reverse-engineering__Wtcgbeg', 'reverse-engineering__gHey5pC', 'reverse-engineering__A8wuuxE', 'reverse-engineering__vxrv8sq', 
'reverse-engineering__akKFunT']",0,"[702.84289, 230.139471, 715.187133, 330.294595, 503.58089]","[26.495439, 43.710548, 47.414767, 156.313853, 57.887182]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,run-pdp11-code,5,"['43d41eec-c1ce-4811-a9f3-709100cf4b74', 'f52872bf-7858-4875-85b8-93ad80211795', 'e002ea60-df41-428f-a2e1-ffca3abe586c', '40546e59-25d0-4530-8155-6a294d001126', '599e85e8-e990-4392-a213-0609027773a8']","['run-pdp11-code__QYKNTLX', 'run-pdp11-code__KewmfsM', 'run-pdp11-code__JoPPmaZ', 'run-pdp11-code__6v8xXWy', 'run-pdp11-code__atszYe7']",0,"[456.179936, 141.756492, 181.911207, 1064.583774, 309.008897]","[131.884796, 46.562831, 21.136313, 268.91491, 13.144772]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sanitize-git-repo,5,"['73862c80-9049-4cc8-9b69-1dff8c4742ae', '9ce965b7-512c-447e-bd03-c41ac2746f4b', '870b8582-653b-4e67-a8e8-1848ce204ba5', 'd3a19304-a725-4868-9bc0-0df4651d34d2', '0ea087ae-f546-49b5-b4ba-465a75adabe4']","['sanitize-git-repo__hwL2sk5', 'sanitize-git-repo__8Sf2UWa', 'sanitize-git-repo__iFHd2nY', 'sanitize-git-repo__GoUpUHH', 'sanitize-git-repo__Nm22Af4']",0,"[133.443598, 436.979807, 127.287694, 372.027776, 205.627928]","[47.570885, 63.948072, 8.602264, 280.611725, 125.306033]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,schemelike-metacircular-eval,5,"['09719bbf-1866-4560-bf4c-d6831caba628', '5242981e-10aa-4a7f-a2d4-64822a4db2af', '77f7aeb1-5d27-4100-9012-cb2286ed7180', '34b25c45-b0ba-4f79-9f03-e9270de7ec2c', 'df555d26-9e80-4b31-836b-0513732216e5']","['schemelike-metacircular-eval__y4FfooF', 'schemelike-metacircular-eval__5asgDBA', 'schemelike-metacircular-eval__hotCT5K', 'schemelike-metacircular-eval__aYatt3H', 'schemelike-metacircular-eval__3zm3TPZ']",0,"[110.246145, 1296.427146, 212.851608, 1564.096975, 399.608925]","[30.929499, 22.412829, 38.102733, 13.623881, 39.921821]",0.0,False,[] 
+meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sparql-university,5,"['8996f43c-62b5-4d28-87f6-d4bb845087cb', '55410dd9-1fd8-4661-8e32-d09b7948300d', 'a9753015-2283-4eca-b470-cf84e34091b5', 'ef7bc6f1-4814-46de-a337-abe419867f9a', '9030fee1-e03c-412e-a189-a1021b294bfc']","['sparql-university__MkXwXmZ', 'sparql-university__YX7avtk', 'sparql-university__LoW4UbW', 'sparql-university__NDtgwDr', 'sparql-university__DiNRcUa']",0,"[41.159927, 929.961259, 57.438985, 595.921087, 102.630775]","[59.013286, 48.885057, 22.352232, 223.805463, 31.957616]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sqlite-db-truncate,5,"['9c70a4c1-925e-43f4-8057-2fa47fcddf75', 'd2edec26-1382-4e3a-a570-eb55de09f260', '53f37b48-29fc-4014-ba84-9dff7882a6e6', '57d30762-11a8-4931-8177-c1f4ad095aa7', '2d301cdc-1a07-4ded-9057-ee70e030663b']","['sqlite-db-truncate__TLaCY3P', 'sqlite-db-truncate__dxMJGiZ', 'sqlite-db-truncate__2DHM9Hz', 'sqlite-db-truncate__sMQWUPA', 'sqlite-db-truncate__AHahQt3']",0,"[277.26134, 147.813211, 603.436217, 212.356638, 190.971173]","[61.103098, 103.86988, 137.698888, 13.014237, 23.47129]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sqlite-with-gcov,5,"['b5a614e8-c774-4f8b-b82e-053e135e475a', 'f7b1dcee-8e5c-48e5-966a-3f61c7bd2d35', 'dac61496-2f32-4e62-9d21-57f4a92cbe78', '04ae2cfa-431b-480f-b18e-eb36b67e8d92', '272dd981-598a-4cec-a6ea-1e1aa5003c26']","['sqlite-with-gcov__4uGdj86', 'sqlite-with-gcov__M7ZdDVS', 'sqlite-with-gcov__RD7JR5A', 'sqlite-with-gcov__5Ug8spc', 'sqlite-with-gcov__Ud7tgAw']",2,"[123.837943, 145.642585, 275.817919, 266.825228, 466.470159]","[18.8751, 26.635077, 29.553513, 76.160939, 66.702182]",0.4,False,"['b5a614e8-c774-4f8b-b82e-053e135e475a', '272dd981-598a-4cec-a6ea-1e1aa5003c26']" +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,torch-tensor-parallelism,5,"['3a05787b-6b08-4a93-8da8-33450486b97a', 'b9ec74d3-3538-4eed-925e-c746b037b41b', '9e7e6013-d316-401d-9db8-4ee78c7f2caf', 
'0ed40dd5-8061-4dad-9655-cfc224202cdc', '2e19f58f-2db6-40f5-a42b-0aad62d039dd']","['torch-tensor-parallelism__7CFhwxb', 'torch-tensor-parallelism__MHSNPQ5', 'torch-tensor-parallelism__jTXkQZf', 'torch-tensor-parallelism__aBdaPa7', 'torch-tensor-parallelism__kaznR6o']",0,"[70.14437, 264.292741, 52.583436, 160.969453, 46.171417]","[22.949511, 88.6936, 23.930013, 21.540981, 213.112437]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,train-fasttext,5,"['6e48cdd4-fb0b-4d1c-a01e-28d6231d3fba', 'e126aa9a-08cc-4aa1-bd15-81c5bcf483d4', '4ffafc8b-7fd7-45fb-ad20-22d8216006bd', '6ceb5cbf-90a1-49ca-bee5-b7467d963fd9', '8311d80e-48a7-4b96-8df8-c22defb54d7e']","['train-fasttext__vRJiVdJ', 'train-fasttext__hgLem3D', 'train-fasttext__tyvdAaq', 'train-fasttext__x87r8NZ', 'train-fasttext__GW4V3B7']",0,"[865.611724, 495.528503, 1005.663952, 507.799676, 2037.41666]","[25.143587, 36.73542, 58.656149, 30.751787, 75.757311]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,tune-mjcf,5,"['03e297f7-5713-4f58-a832-08c5bde03d26', '4d81f75d-8f9f-4466-92d8-310acfb90546', '106afd33-2aac-4f17-8d8f-198342f7bde5', '68f8aa93-d7fa-4ae9-b791-5d420f3cd223', '59caa329-bdb3-48ad-92e4-c817e42853d1']","['tune-mjcf__wYLTvNJ', 'tune-mjcf__UjUD8Uw', 'tune-mjcf__x2QQs9D', 'tune-mjcf__bUp33fw', 'tune-mjcf__HZHrHb7']",0,"[476.42247, 926.874961, 224.108556, 907.127844, 534.280481]","[45.451316, 14.453826, 17.968965, 24.389652, 10.081915]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,video-processing,5,"['4a36f880-8c1c-4050-8338-d3f08073109e', 'a3c97c9e-32d1-4d8c-9528-d2cea743ca93', 'b2b6071d-00c1-4a2d-b8d9-b9749eb1470c', '09d959b6-861c-440b-89b9-bc9f7ec41ba3', '9592c3f0-7cc6-4178-9fd4-d5b12a2c7165']","['video-processing__4pxs5Ep', 'video-processing__q5cp7Lz', 'video-processing__wBtoGZe', 'video-processing__2PwWtPL', 'video-processing__9FYDnC4']",0,"[208.550899, 82.390943, 742.73969, 67.720195, 370.757384]","[62.872195, 12.145253, 33.195701, 107.327004, 
40.159607]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,vulnerable-secret,5,"['2a08416e-f896-4c8d-ade4-91265fcb5079', '6a1aa59a-44c7-4f6c-9cad-4cdcf271d4df', 'da528a2d-7a4f-483b-b4ef-844a2a4da5b2', '9ef3a495-c9ee-45d7-819c-c274a66a64c4', '1be10523-5c7d-4e16-8107-ea9159eaeadc']","['vulnerable-secret__2h5Ae49', 'vulnerable-secret__6c2v2CG', 'vulnerable-secret__AD7pbKG', 'vulnerable-secret__2kLGkiM', 'vulnerable-secret__CahfYHs']",0,"[286.823811, 302.983967, 97.466118, 908.632177, 142.002919]","[52.272073, 81.932103, 13.099107, 14.090519, 10.820059]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,wasm-pipeline,5,"['4e2e041a-ab53-4e39-8033-020674a4e5de', 'b58be45c-0809-467d-8110-458d5c47422f', '4b1d74f6-94ca-45fd-8ce6-c34ef716ed70', '182654d0-a890-44f5-a277-3fc3ec0e945b', '96d1b96b-e346-4460-a737-a4d5f73c8e8a']","['wasm-pipeline__yq6Bftx', 'wasm-pipeline__PBg4YkE', 'wasm-pipeline__JsyfLtu', 'wasm-pipeline__LvcME62', 'wasm-pipeline__6wzch56']",0,"[138.191678, 541.587887, 86.213469, 108.523803, 573.818803]","[69.693567, 3.996184, 42.831258, 3.998723, 5.313385]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,winning-avg-corewars,5,"['8993c076-aa77-4659-80e7-3b742204c767', 'deaee93e-694c-4911-bf71-32e8ba278a59', '871eadef-c259-4879-9160-9b893e0a0907', '9a906fc2-4488-481e-963a-ffa0e26868ed', '6f2f91a4-6cc5-40c6-b7ff-dddfbe67367c']","['winning-avg-corewars__2qYAUQg', 'winning-avg-corewars__PocxuGt', 'winning-avg-corewars__QiXyLHV', 'winning-avg-corewars__QuaiaLR', 'winning-avg-corewars__zyjTt6g']",0,"[777.603079, 1622.418055, 585.866595, 410.815988, 543.182002]","[23.694544, 84.288235, 4.336506, 4.242733, 5.059278]",0.0,False,[] +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,write-compressor,5,"['eb19de81-6235-4257-9e0f-26468b1e4d7f', 'db5b5d4b-0dda-450d-85f5-dc573787c304', 'eebfbd38-57e9-4bde-82db-d613e109da51', '67323d2f-7b71-4ebf-9a3c-8a246dcb1522', 
'a73ec9f9-2613-4db3-9a4b-ea2e4d0a271c']","['write-compressor__kXi56st', 'write-compressor__VEsJGAw', 'write-compressor__yz76hF2', 'write-compressor__XVYMTSX', 'write-compressor__L9nv8f7']",0,"[59.24247, 306.709834, 951.187845, 904.193577, 1205.02096]","[24.76756, 101.648634, 133.34807, 137.797905, 828.262534]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,adaptive-rejection-sampler,5,"['d03e12ad-c390-48a4-a362-91ee2387ff17', '3678bd85-6fd1-44a1-a741-2bd13d1bfd43', '39bb1cc9-64bf-48c5-b4ba-488d0b480755', '805ae946-1ad2-49ee-947f-3beb0cc852ea', 'de00bde2-f409-45d1-88d7-a6c4673035ff']","['adaptive-rejection-sampler__BhPzAcv', 'adaptive-rejection-sampler__KwGddB7', 'adaptive-rejection-sampler__gTKkETk', 'adaptive-rejection-sampler__PXNscXg', 'adaptive-rejection-sampler__iYQ25Km']",0,"[903.530692, 900.33538, 900.040032, 909.112255, 912.518545]","[57.05896, 87.927658, 20.896812, 66.311701, 32.140381]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,bn-fit-modify,5,"['cc708231-824a-4d53-9b07-ae7b75e66a77', 'e7c1926a-9ebd-4f80-afe1-ac4f395b4824', '05bbbced-8720-43a2-adef-4c5b1a365b3f', 'bdd8a5cd-0329-4b93-b729-cc2be43efd06', '7aa3cb3a-60fc-4cf0-bcd2-b47eb8c01aa0']","['bn-fit-modify__rdMECEQ', 'bn-fit-modify__Ua53oPz', 'bn-fit-modify__hh7vTLU', 'bn-fit-modify__242oni3', 'bn-fit-modify__pjDFu7g']",0,"[2868.985022, 1182.862434, 498.761609, 927.795137, 1260.241971]","[166.306918, 101.499679, 42.057777, 110.091279, 202.81665]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,break-filter-js-from-html,5,"['f054b6f0-946d-4feb-8b7c-5b2d85fe5ead', 'dbf42741-22a3-484a-aea8-586d8771719d', '24e5a5c8-a6fb-4a4d-a194-bcdc461d7e94', '91f1ca39-a09b-4c21-9c8d-92f41dd28a87', 'ec2cfd39-9f07-4302-88c8-e67fe228657f']","['break-filter-js-from-html__N7nju7u', 'break-filter-js-from-html__NQbqzsL', 'break-filter-js-from-html__uPXQL8w', 'break-filter-js-from-html__r5EtEga', 'break-filter-js-from-html__TsyvdYT']",0,"[1223.14811, 1214.264073, 1200.199585, 1207.503912, 1235.606973]","[103.897058, 
36.249291, 13.18143, 32.494951, 116.835158]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,build-cython-ext,5,"['0fd3a1d6-910d-42ef-8bfd-b447bbb9a98d', '7a63d8dc-80c5-45af-ae0b-cb781a904349', '09a56d5c-89e8-4256-b590-c3fee3bd55c8', '5f96c7f8-c590-4f5b-a61d-dae288a58ff9', 'ef6066a3-c2a6-4abf-8e63-0af602aa0257']","['build-cython-ext__YJHpaKP', 'build-cython-ext__Haa56Uc', 'build-cython-ext__LA8XKtE', 'build-cython-ext__89AbC73', 'build-cython-ext__6Z8zmf9']",0,"[792.514784, 802.605653, 745.966361, 907.262655, 913.170316]","[66.049274, 130.234065, 35.466834, 122.132186, 34.045476]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,build-initramfs-qemu,5,"['34334893-efad-4109-9784-d0245a0a8599', '3571d2e4-6aa9-4289-bf01-10cc763e75e9', '9dfd5c5f-a61c-4daf-9bdf-5643c5ae6a7a', '0db59121-da44-4a2f-b202-6d8eaff52d5d', '6834953e-7cff-43f5-88c4-5a6610030470']","['build-initramfs-qemu__hnzZNvY', 'build-initramfs-qemu__gAGtzvL', 'build-initramfs-qemu__44kDezq', 'build-initramfs-qemu__zMPHYWb', 'build-initramfs-qemu__JnHcJrG']",0,"[907.024987, 328.104842, 526.349524, 352.566952, 528.755006]","[25.820147, 51.861317, 50.186309, 39.161409, 102.597644]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,build-pmars,5,"['0f6ed156-2a7c-4e1b-8af3-130ee219fca8', '34d09eb7-be5c-4b41-8823-ac82595bd8bb', 'b0d2d742-b0f4-442e-911b-6f133cb25a14', 'e10ed5a2-5699-42b3-b392-0b39b79731fa', '58b0e2fb-6981-476a-8664-4ae1db2569d2']","['build-pmars__kvbBwsJ', 'build-pmars__2c465yF', 'build-pmars__CAAkYHu', 'build-pmars__ENn3rP5', 'build-pmars__9kegwbB']",4,"[773.995493, 669.615436, 2011.660821, 749.380596, 565.936369]","[14.089589, 19.603637, 9.502591, 39.656061, 2.126092]",0.8,True,"['0f6ed156-2a7c-4e1b-8af3-130ee219fca8', '34d09eb7-be5c-4b41-8823-ac82595bd8bb', 'e10ed5a2-5699-42b3-b392-0b39b79731fa', '58b0e2fb-6981-476a-8664-4ae1db2569d2']" +moonshotai/Kimi-K2-Instruct-0905,build-pov-ray,5,"['6817b652-2442-42d8-8e5e-1c98b65b7a39', 'ccd7f8f1-eac1-492b-b061-23898aa8af24', 
'cad37194-b58f-458f-a779-5f3b984bc7fb', 'fa5d53e1-5fee-4256-bac0-d7ffbc7100b8', 'a3ccf7a6-342a-4b03-999c-06f91aac4bcc']","['build-pov-ray__6cTNumt', 'build-pov-ray__NGJ9h3J', 'build-pov-ray__WSKECee', 'build-pov-ray__ZNRYmkC', 'build-pov-ray__JTWz4Rt']",5,"[986.831139, 3975.188471, 1779.940368, 1080.864159, 1247.643931]","[47.588353, 110.882461, 39.210116, 36.133887, 67.491769]",1.0,True,"['6817b652-2442-42d8-8e5e-1c98b65b7a39', 'ccd7f8f1-eac1-492b-b061-23898aa8af24', 'cad37194-b58f-458f-a779-5f3b984bc7fb', 'fa5d53e1-5fee-4256-bac0-d7ffbc7100b8', 'a3ccf7a6-342a-4b03-999c-06f91aac4bcc']" +moonshotai/Kimi-K2-Instruct-0905,cancel-async-tasks,5,"['c41afec4-6ea4-42fa-b4df-75657ceb36f4', 'e94f9f0c-e177-43cc-8b77-8abd50be1b02', 'e1a62e76-4b7c-4a2a-96ce-5be16a5e5084', '2d94aae1-15e3-4a1e-ba0d-0e98c96d3c94', 'b1f60041-2da9-4b86-9269-bd16f9fd9cf8']","['cancel-async-tasks__PNJrLMy', 'cancel-async-tasks__zNEtuyp', 'cancel-async-tasks__BghVCGR', 'cancel-async-tasks__cAZnDLF', 'cancel-async-tasks__xDjLXeL']",3,"[131.481846, 405.314407, 896.774426, 289.044358, 231.979442]","[38.31693, 60.362086, 175.17596, 78.158113, 63.405127]",0.6,True,"['c41afec4-6ea4-42fa-b4df-75657ceb36f4', 'e1a62e76-4b7c-4a2a-96ce-5be16a5e5084', 'b1f60041-2da9-4b86-9269-bd16f9fd9cf8']" +moonshotai/Kimi-K2-Instruct-0905,chess-best-move,5,"['3984abde-a929-4da4-8b97-2d5d94c2b6c6', '2a604b79-7fec-47d4-8ad4-a79ab9d46ac3', '92666a36-d44e-4dad-9bab-d1f3563a4938', '374c0fa7-66c5-4562-a639-ed253a56d108', '074a4b05-2421-4030-b5f8-f088add70539']","['chess-best-move__ncKDkoH', 'chess-best-move__SmRT7o9', 'chess-best-move__s3XZUiN', 'chess-best-move__6B7dR8W', 'chess-best-move__ehXAVLk']",0,"[471.861006, 559.726776, 773.527844, 900.02618, 907.607489]","[8.767876, 13.416593, 340.217634, 36.836226, 99.511208]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,circuit-fibsqrt,5,"['a7434d54-fed2-489c-aaf5-de9db27742a5', '7aece6b0-620a-43e7-9e71-3097b912639b', '625cfd07-98f0-476d-bca7-95a46f4521fe', 
'09713cbb-464c-464f-bfa9-dbee1168de13', 'f14077fe-ccb2-4a70-b35f-a01dbd819a7a']","['circuit-fibsqrt__ghKpk2m', 'circuit-fibsqrt__m4AM7U3', 'circuit-fibsqrt__kJ9k3CZ', 'circuit-fibsqrt__AQVhtHj', 'circuit-fibsqrt__ciFZt5p']",0,"[3615.434352, 1391.303329, 1370.503314, 2370.808709, 3624.453492]","[42.84543, 23.688281, 14.655305, 13.399629, 162.096903]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,cobol-modernization,5,"['404fa14c-bdc6-4a87-9fcf-46b988f4ced9', '4c25ebc8-f90f-461c-822e-c2bc870ee96b', '3a29b6e7-1db4-4554-b6c0-99d82106a63f', 'c852d816-d4fd-432f-b502-aae29519c613', 'ede3a59d-a84a-42c1-87ea-d41aae22b464']","['cobol-modernization__bJNJagz', 'cobol-modernization__5KVUGVG', 'cobol-modernization__bvtNB6Z', 'cobol-modernization__RN2c6VC', 'cobol-modernization__xE7Hpvd']",3,"[919.764676, 915.755655, 900.016399, 914.722451, 902.580559]","[118.557949, 53.517977, 80.58903, 46.163061, 32.83456]",0.6,True,"['404fa14c-bdc6-4a87-9fcf-46b988f4ced9', 'c852d816-d4fd-432f-b502-aae29519c613', 'ede3a59d-a84a-42c1-87ea-d41aae22b464']" +moonshotai/Kimi-K2-Instruct-0905,code-from-image,5,"['71c7f1e5-b7e4-429c-b9bf-44731d4e12f0', 'a968c80e-1797-4174-bfd4-ce0f986e1747', 'fde7b665-7e20-40ea-9bcd-076e730aa57e', '06ea7903-4d64-4826-b17a-e0d939b40a12', '0e3bf38e-4a77-4be3-b2d5-004f8b27145b']","['code-from-image__Hms3Q2a', 'code-from-image__h6Rdyzc', 'code-from-image__ZK4x3PC', 'code-from-image__vHmzBD2', 'code-from-image__TKr45Jo']",3,"[407.311086, 124.129238, 420.224504, 1202.914415, 278.236347]","[40.306958, 48.561655, 15.761137, 51.732877, 18.987039]",0.6,True,"['71c7f1e5-b7e4-429c-b9bf-44731d4e12f0', 'a968c80e-1797-4174-bfd4-ce0f986e1747', '0e3bf38e-4a77-4be3-b2d5-004f8b27145b']" +moonshotai/Kimi-K2-Instruct-0905,configure-git-webserver,5,"['efc8bdeb-3d7c-4ef9-97e8-70d3279745c8', 'f58f6292-ae5e-4699-abb2-4a9a20f8da86', '8f39ec56-51af-497a-bd4f-235c50aa2fe0', '6730bc51-36f3-4a1a-b59c-c60bfc78b64f', 'b57d4fc9-d8d5-43d0-9d20-488b6ceff5c5']","['configure-git-webserver__sJdVT7z', 
'configure-git-webserver__aT6SB53', 'configure-git-webserver__8P25Kv6', 'configure-git-webserver__8PUfLso', 'configure-git-webserver__KtjneJR']",3,"[789.772052, 369.364724, 604.730001, 915.02036, 592.978233]","[21.434389, 58.959436, 48.648035, 109.22108, 188.821851]",0.6,True,"['f58f6292-ae5e-4699-abb2-4a9a20f8da86', '8f39ec56-51af-497a-bd4f-235c50aa2fe0', 'b57d4fc9-d8d5-43d0-9d20-488b6ceff5c5']" +moonshotai/Kimi-K2-Instruct-0905,constraints-scheduling,5,"['82ec03ad-af46-41e1-8425-3cb4a0fb497a', '18d5ce4b-d83a-4733-b994-91112c211f11', 'ebfa2537-798b-4756-b92b-bb9b40642e94', '9a7afbcd-4b33-4d6f-9820-044158f8f40d', '01162b33-c7cb-4566-9660-b8fa4f34d8d6']","['constraints-scheduling__7FR3VCX', 'constraints-scheduling__MNU2GFh', 'constraints-scheduling__fgpQQKg', 'constraints-scheduling__ak7B4wP', 'constraints-scheduling__KyeccWP']",3,"[360.88604, 474.385982, 601.522393, 424.373953, 199.944679]","[134.322799, 36.214711, 173.866308, 50.247968, 12.510977]",0.6,True,"['18d5ce4b-d83a-4733-b994-91112c211f11', 'ebfa2537-798b-4756-b92b-bb9b40642e94', '9a7afbcd-4b33-4d6f-9820-044158f8f40d']" +moonshotai/Kimi-K2-Instruct-0905,count-dataset-tokens,5,"['f024c09f-67a1-4fdc-9db6-8853dacca02e', '89055f67-1b67-40b3-bdf9-97efb99e91bf', '40e7bb68-125a-4b22-818a-99f6f388619c', 'd5b82da5-ddac-41dc-8340-203c197abeec', '9854421f-bc1a-4372-85fb-60f5ebdfe4fd']","['count-dataset-tokens__HriDyZk', 'count-dataset-tokens__xzQ3EDb', 'count-dataset-tokens__vrLEHNX', 'count-dataset-tokens__FeBzb5a', 'count-dataset-tokens__3VxdFv2']",1,"[564.917355, 729.314036, 850.509198, 938.349622, 322.131671]","[16.990992, 31.896635, 49.431667, 97.854437, 99.847223]",0.2,False,['40e7bb68-125a-4b22-818a-99f6f388619c'] +moonshotai/Kimi-K2-Instruct-0905,crack-7z-hash,5,"['1a58bf97-4d56-4c0b-8576-585d0a72d078', '1934a47d-4788-4c63-a85c-f9989722939e', 'f77f28fb-a961-40c6-8b27-8f86b2401dc3', '1ee1a670-cbb8-4ae4-a2d1-8d889395b622', '3eacad70-53e6-47f6-97d1-0e61be9d806f']","['crack-7z-hash__qmWDDKe', 
'crack-7z-hash__ZZNqX96', 'crack-7z-hash__sDZacdK', 'crack-7z-hash__ceHP7Nh', 'crack-7z-hash__C7idm2t']",5,"[312.902691, 290.86407, 309.726764, 406.804382, 598.225772]","[11.049948, 15.835954, 144.069677, 37.096541, 27.36721]",1.0,True,"['1a58bf97-4d56-4c0b-8576-585d0a72d078', '1934a47d-4788-4c63-a85c-f9989722939e', 'f77f28fb-a961-40c6-8b27-8f86b2401dc3', '1ee1a670-cbb8-4ae4-a2d1-8d889395b622', '3eacad70-53e6-47f6-97d1-0e61be9d806f']" +moonshotai/Kimi-K2-Instruct-0905,db-wal-recovery,5,"['b85060d9-03a4-4ffc-9d45-20e52f5e6f1b', '5790beb7-d658-460b-9988-92d5ad239da9', 'bd2ae3a3-ae0c-45d4-8537-dd0755ab7dfd', '327719e8-f7ca-450a-a2b4-7816903ae765', 'f9ac8190-0d0d-4692-9176-e63a23affec3']","['db-wal-recovery__5noynko', 'db-wal-recovery__dTdYiws', 'db-wal-recovery__d9XJpau', 'db-wal-recovery__npnmHhm', 'db-wal-recovery__eVVLFkK']",0,"[303.838788, 957.637056, 910.921974, 127.840978, 519.020555]","[9.48224, 14.00535, 62.069592, 15.624396, 80.666545]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,distribution-search,5,"['c7ce51aa-46ee-48b7-babb-5fc0562d9331', '68c94c50-4321-4aee-991b-80bad70c0e66', '85ccd1dc-8474-4311-8f5b-4d7e22ac6358', 'c54620ba-5fde-47c0-a0d0-707b57e59589', '4ffbb745-91b7-425a-b06b-d697df5bb683']","['distribution-search__QwHnSo7', 'distribution-search__mZPeiGr', 'distribution-search__A62JMRa', 'distribution-search__ZrbvQSj', 'distribution-search__zWkh8E3']",1,"[1127.574018, 582.754334, 1894.392897, 1642.710512, 2767.392332]","[78.614327, 55.212158, 42.688813, 206.541131, 126.979995]",0.2,False,['68c94c50-4321-4aee-991b-80bad70c0e66'] +moonshotai/Kimi-K2-Instruct-0905,dna-assembly,5,"['98d2a0be-9a5b-43a5-a75f-6680a60e9d28', '3c51cb50-3450-4ca4-bcb2-38581be30242', 'f77a0798-df34-4780-9760-8a0e9238c37b', '415a3ca5-14da-4beb-88e7-7b0fe89797df', 'e495ed63-5774-4d09-9924-8284d438715b']","['dna-assembly__2UNSNkK', 'dna-assembly__w7PEJja', 'dna-assembly__Re83USB', 'dna-assembly__eBdpXW7', 'dna-assembly__M4DBMmp']",0,"[339.335305, 738.702978, 744.495063, 
720.409605, 618.855287]","[61.013403, 35.762128, 40.499897, 27.776737, 51.024902]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,dna-insert,5,"['d2cc7b3a-fb7f-4e08-ba54-9d0c3c11d2cd', '5ac1cc5d-2751-4eae-a5d9-96a4da87c5c4', 'fbf21dcc-dc60-4165-9d8f-be4331582349', '8e52bf68-bce6-402d-a94f-b0bd3feabb37', '4c87580d-0abf-4283-b736-01f5cbf60a14']","['dna-insert__4pqkP7x', 'dna-insert__6YbwLdX', 'dna-insert__3V2fJSC', 'dna-insert__gwKoU6S', 'dna-insert__MxdJnFj']",0,"[360.00195, 417.386783, 380.849063, 372.595116, 361.154423]","[355.128591, 37.119588, 16.505014, 80.763232, 68.822001]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,extract-elf,5,"['b35b8bcf-1cd9-44f8-9f2c-ae9cc35c67c0', 'eceb3b8d-e720-4f5a-8312-e29233f9626a', 'e7ca6a41-bd23-43cc-85ad-03017aed676a', 'fd49775d-337b-4213-86d0-f821857e7099', '76aa9bb2-cb8f-49bf-af06-aa17a0b6020d']","['extract-elf__SNYviL9', 'extract-elf__nYkF3Zr', 'extract-elf__6PrDyJP', 'extract-elf__6LgcuFV', 'extract-elf__Hcd3AYf']",3,"[559.724871, 355.680177, 900.000923, 555.879275, 536.281287]","[24.402262, 135.029752, 92.852315, 48.055433, 28.38502]",0.6,True,"['b35b8bcf-1cd9-44f8-9f2c-ae9cc35c67c0', 'e7ca6a41-bd23-43cc-85ad-03017aed676a', '76aa9bb2-cb8f-49bf-af06-aa17a0b6020d']" +moonshotai/Kimi-K2-Instruct-0905,feal-differential-cryptanalysis,5,"['d2f56d4a-6033-4142-9262-4f6b7063741e', 'e3ade6ea-eb25-46fe-b73e-f23c923b94fc', 'eb6bc6bc-0941-4e03-8ae8-6fc3a3941013', '7e0cf1d1-6a8c-464c-9cdc-1fef9e8c66fa', '52705aba-dec6-4cae-8008-119f574f53d3']","['feal-differential-cryptanalysis__opVD5d2', 'feal-differential-cryptanalysis__gqyKPTS', 'feal-differential-cryptanalysis__tHvLvdM', 'feal-differential-cryptanalysis__ozqw2tu', 'feal-differential-cryptanalysis__xHV7UnX']",0,"[1808.40788, 1299.273454, 1800.032216, 1271.928934, 1818.796497]","[36.189993, 239.254697, 75.4711, 95.79668, 24.160043]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,feal-linear-cryptanalysis,5,"['17ea7461-db60-4a35-ba2f-794a9f8f472f', 
'4d787dea-0d61-4670-bdaa-ae25753d3785', '3d697603-9e53-456b-91ce-e7619363c6b2', '2a577057-8f4d-4baf-8141-afd3b3311534', '7d4e9777-04ea-4eab-8112-37b33c3434ac']","['feal-linear-cryptanalysis__ZCaFaXP', 'feal-linear-cryptanalysis__QxTQvoy', 'feal-linear-cryptanalysis__EryUBGv', 'feal-linear-cryptanalysis__h9YgieW', 'feal-linear-cryptanalysis__9jw7yj2']",0,"[1819.80891, 1805.750966, 2443.52322, 1830.016618, 1810.122203]","[44.069776, 160.144981, 20.160482, 34.388217, 21.741866]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,filter-js-from-html,5,"['b0cd3510-5146-4a50-bafb-7da7c09654c5', 'f2c36357-3159-4844-aabd-58c4159f957d', 'c329d066-2cdf-4f52-af72-b07fb06f3e3a', '93e21952-23fc-4698-9919-a843da9ee341', 'c201cda0-1d24-47f2-a9f9-80f79aadf5d6']","['filter-js-from-html__VQoJUQp', 'filter-js-from-html__CA3oQSn', 'filter-js-from-html__KY8fCZQ', 'filter-js-from-html__nsyrsoh', 'filter-js-from-html__r67awm2']",0,"[707.178394, 746.395909, 579.247683, 335.55509, 775.028371]","[22.380515, 62.065129, 24.322063, 47.579942, 38.380604]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,financial-document-processor,5,"['88f73130-4828-4fdf-9c42-75e7d1c2f818', '1546dec3-a5bd-4408-8c67-4725f6501921', 'acbe80b2-aabe-4c09-aae7-6905c0c66816', 'cc51af98-1dce-45a1-8249-d05c8445e2f6', 'aaf3fe24-154a-47da-afd1-23768c05d30e']","['financial-document-processor__64pNyit', 'financial-document-processor__4X5Rfn8', 'financial-document-processor__Re5rcdV', 'financial-document-processor__QewwXK7', 'financial-document-processor__DNhp6tb']",0,"[1204.663633, 392.163094, 538.449639, 1175.052338, 650.56219]","[29.407857, 48.406481, 102.22958, 199.902133, 18.627523]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,fix-code-vulnerability,5,"['55680f76-afa8-44ed-9c35-8450c50286fd', '196c9b7a-0588-4921-906f-2f3b13dc9920', '916bc4b9-9649-495e-9f85-0f81271cf830', '982f680a-a55a-4e5d-abf5-e152f7562d3d', '496cbc61-7ef3-420e-8263-34a5b82b2108']","['fix-code-vulnerability__AFaiMYL', 'fix-code-vulnerability__EmuFwZX', 
'fix-code-vulnerability__rnoXkW9', 'fix-code-vulnerability__mZHhp49', 'fix-code-vulnerability__7yUHhJU']",0,"[930.576183, 592.381116, 900.037763, 900.129505, 1011.764671]","[36.313752, 44.046213, 12.466346, 52.50562, 10.99347]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,fix-git,5,"['f24bd6b7-733a-493d-976c-c9cf80698bf4', '235e0bdf-a8ec-4ba4-9444-3ea33cdb0071', '881a261a-9ddc-4050-acbd-de862f6c5851', 'ae480f5e-5805-4eff-b63a-8e4b404112bd', '6188bac0-4578-4117-a337-68845fdbf8f6']","['fix-git__jyM6H2B', 'fix-git__afGVbHD', 'fix-git__Eswm77N', 'fix-git__348GjPm', 'fix-git__DzRXuCw']",5,"[347.422022, 897.086075, 328.626363, 336.181738, 319.100462]","[13.291785, 11.94375, 47.301934, 27.600888, 17.524125]",1.0,True,"['f24bd6b7-733a-493d-976c-c9cf80698bf4', '235e0bdf-a8ec-4ba4-9444-3ea33cdb0071', '881a261a-9ddc-4050-acbd-de862f6c5851', 'ae480f5e-5805-4eff-b63a-8e4b404112bd', '6188bac0-4578-4117-a337-68845fdbf8f6']" +moonshotai/Kimi-K2-Instruct-0905,fix-ocaml-gc,5,"['2cf7f8b8-3f04-4ddc-9928-1526e9691f0b', '55446577-2f3e-4f12-81f9-62ba0335484a', 'd87a57cb-03bc-4e85-a348-bebe3b803185', '8172a25e-7b9b-4e90-b167-592f75300151', '348e38d8-e712-448a-a243-1c9723bc139d']","['fix-ocaml-gc__UXodcug', 'fix-ocaml-gc__ymPxLfq', 'fix-ocaml-gc__Pdndrjn', 'fix-ocaml-gc__7uHzSn8', 'fix-ocaml-gc__MYSiZhe']",0,"[3602.065217, 2191.174596, 1420.513525, 2332.50221, 3740.214872]","[44.776681, 43.186284, 35.677908, 83.634684, 24.234044]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,form-filling,5,"['27dd78d5-f4f2-493c-8ee1-f0c75fb92e88', '4494df2c-3164-4d38-82e4-efe499bf9d84', 'e14921d8-3dcc-4de4-8966-81852fc9304b', 'c4d4b96e-1911-4eb9-9763-44bf668f7a4f', 'd1b635f8-0053-4f51-9a24-f4275356c3d4']","['form-filling__8GiQRUn', 'form-filling__PNbchLc', 'form-filling__Pb4RN4r', 'form-filling__gWyckHP', 'form-filling__NQWrAz9']",4,"[327.209381, 397.287931, 676.929552, 347.424744, 467.072363]","[3.283513, 8.914183, 43.468131, 5.606395, 86.33581]",0.8,True,"['27dd78d5-f4f2-493c-8ee1-f0c75fb92e88', 
'e14921d8-3dcc-4de4-8966-81852fc9304b', 'c4d4b96e-1911-4eb9-9763-44bf668f7a4f', 'd1b635f8-0053-4f51-9a24-f4275356c3d4']" +moonshotai/Kimi-K2-Instruct-0905,git-leak-recovery,5,"['0e79fa68-6f33-46be-92fa-282233ca20e8', '701cfce1-6a2c-4cc5-9905-fb5bd12c66d2', '01d83249-77ec-4931-b12b-4805b6ea004b', '1354cfe7-e4c7-4885-ac40-12d8b56e40be', '11670a27-f9ea-4496-9c8c-4b9e04cdc3cb']","['git-leak-recovery__GQX3bbJ', 'git-leak-recovery__viojuzv', 'git-leak-recovery__ucq4A7e', 'git-leak-recovery__jZnHGf9', 'git-leak-recovery__2wfVfhj']",5,"[266.738993, 268.991108, 169.975227, 241.844258, 920.543412]","[141.512821, 42.589696, 183.138168, 53.284138, 37.173964]",1.0,True,"['0e79fa68-6f33-46be-92fa-282233ca20e8', '701cfce1-6a2c-4cc5-9905-fb5bd12c66d2', '01d83249-77ec-4931-b12b-4805b6ea004b', '1354cfe7-e4c7-4885-ac40-12d8b56e40be', '11670a27-f9ea-4496-9c8c-4b9e04cdc3cb']" +moonshotai/Kimi-K2-Instruct-0905,gpt2-codegolf,5,"['235287e7-1b7d-45ec-a9d6-16275623fa2b', '651d6c3f-f87b-44c7-9bfd-e13ff2cace3f', '61675f35-6b20-4de5-ac87-ff924acc7bdf', '319f5b4a-1bdf-4402-8e19-2fdf06557625', '41a76398-04b5-4076-8560-be89f2676739']","['gpt2-codegolf__AMNqu6d', 'gpt2-codegolf__eE4cWZW', 'gpt2-codegolf__eUdipdG', 'gpt2-codegolf__nXWyqH8', 'gpt2-codegolf__kirYNgq']",0,"[462.656621, 905.922495, 900.028442, 662.719464, 908.112842]","[67.541928, 30.910186, 262.045732, 81.558664, 49.758768]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,hf-model-inference,5,"['8bf118f7-ad47-44a6-a584-5b16a67c7ccf', '9487c006-b3f3-46f5-aa58-db961dd0798e', '5bd5fbb1-5125-4fac-9abe-04feb78059e5', 'a400b2a4-a299-4ace-a818-7b63b51d5b64', '55abd204-1219-4a73-9d7f-63981a2c1251']","['hf-model-inference__HUXRx9G', 'hf-model-inference__WZV4ozr', 'hf-model-inference__TBTXfvZ', 'hf-model-inference__AVdkTYv', 'hf-model-inference__WRKBJGx']",0,"[403.607774, 918.51472, 683.018879, 453.037159, 686.606258]","[37.654969, 14.881937, 24.143126, 26.530544, 36.701642]",0.0,False,[] 
+moonshotai/Kimi-K2-Instruct-0905,install-klee-minimal,5,"['f46a9e2c-062e-410d-9d24-35c0e93b868f', '49a77aef-0dce-4d98-83c8-9784f2699048', '161a3789-cf56-4335-9996-f0bb26832b7a', '2ac3e485-450e-4946-9fef-22661df31e00', '702a4368-6487-486b-ad1c-75dbeec4e270']","['install-klee-minimal__gbwPAxp', 'install-klee-minimal__dj67icH', 'install-klee-minimal__A9FRfJJ', 'install-klee-minimal__yCxVrLT', 'install-klee-minimal__votRXJJ']",0,"[931.848327, 906.862312, 904.157665, 905.783931, 902.115913]","[38.629558, 71.802257, 113.230138, 21.362983, 53.503712]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,install-windows-3.11,5,"['dcbf9b3d-13d8-485e-b37b-c163f959fa15', '76d25d68-9482-42df-b78b-bc72905fccb5', '80653225-189c-49c3-9a80-239fa55a962a', '08729cc1-bb32-450c-bc9d-3d1ca07c44a8', '135185e4-0e1f-4bbc-adcc-8eca9aaea319']","['install-windows-3.11__9pWu6ry', 'install-windows-3.11__x2qwB5L', 'install-windows-3.11__jqiDBf9', 'install-windows-3.11__HQhxxMJ', 'install-windows-3.11__pvs5cZ6']",0,"[530.472989, 1271.822643, 350.44511, 249.859577, 1177.880196]","[24.420864, 13.808266, 23.55466, 45.904058, 58.660088]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,large-scale-text-editing,5,"['d9cdb001-d9ce-45ad-92ff-481a1abc6d54', '3ae214fb-fee1-4a31-a18a-4933c307580d', 'a7b3dede-597d-4ea7-8ba0-905d43e93c23', '161c701e-79d9-4b23-8d40-a22ee6984732', '2ad9b966-70af-4825-aba7-d63b3d0fd403']","['large-scale-text-editing__8FAkdLu', 'large-scale-text-editing__5kcJV6d', 'large-scale-text-editing__TUrXve6', 'large-scale-text-editing__wWRLCHw', 'large-scale-text-editing__J6wnFUF']",0,"[1211.197888, 1221.816872, 591.376498, 1245.096642, 1201.332374]","[71.79171, 146.649095, 257.050506, 16.006327, 15.136249]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,largest-eigenval,5,"['13f66ada-763e-4105-bf66-b3e4bb97a38e', 'a4b07c7e-19bc-4c3b-aac3-30770b583772', '259414e9-193c-440f-9f29-b462489cd762', '438da45e-2138-499c-960b-37923d6859ab', 
'e2012e6c-2fcd-433e-8557-7618b9517708']","['largest-eigenval__7cYqC8Q', 'largest-eigenval__zFa5eWt', 'largest-eigenval__7fh3yxe', 'largest-eigenval__mdKoYj5', 'largest-eigenval__J7heFmk']",1,"[916.13923, 729.444764, 910.658507, 908.713165, 541.384516]","[179.837114, 64.583446, 126.225684, 52.440153, 51.255052]",0.2,False,['e2012e6c-2fcd-433e-8557-7618b9517708'] +moonshotai/Kimi-K2-Instruct-0905,log-summary-date-ranges,5,"['4ec37157-0f8b-459f-9961-d7312aa8a6c4', 'ed0414d2-8d05-4cd4-8499-6d9bd4dc9b94', '61050336-bb24-4ee8-94de-ce9fe730b482', 'e59a7ba4-c580-4bea-81d5-49485b946047', 'efe50b4b-77d7-4521-8cd2-cd52fd924e57']","['log-summary-date-ranges__pSgox5p', 'log-summary-date-ranges__WByV2or', 'log-summary-date-ranges__AmTeZpc', 'log-summary-date-ranges__krRxzvm', 'log-summary-date-ranges__xEKDDs2']",4,"[166.977851, 337.784765, 410.260485, 127.136382, 272.706163]","[44.80208, 29.574381, 20.508822, 16.805559, 51.462951]",0.8,True,"['ed0414d2-8d05-4cd4-8499-6d9bd4dc9b94', '61050336-bb24-4ee8-94de-ce9fe730b482', 'e59a7ba4-c580-4bea-81d5-49485b946047', 'efe50b4b-77d7-4521-8cd2-cd52fd924e57']" +moonshotai/Kimi-K2-Instruct-0905,make-doom-for-mips,5,"['836af897-cac7-46e5-8e3d-493af2a2cfd2', '2715c613-1d22-4b6f-8082-af675a5fe2a2', 'd8bb51cf-591b-4add-9c91-a00e08a3bd83', '8d3b5229-627f-49e0-bc79-2690c6c1235b', '55f63ef5-dfcf-4386-9686-5be567cf5f32']","['make-doom-for-mips__ngH8szb', 'make-doom-for-mips__kGaNA2A', 'make-doom-for-mips__5MDPSgD', 'make-doom-for-mips__a6uNjxR', 'make-doom-for-mips__zZvnciB']",0,"[1002.425557, 908.134936, 908.135969, 901.27387, 907.866592]","[140.552612, 20.178647, 29.956003, 105.003057, 205.690478]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,make-mips-interpreter,5,"['2144d0be-61d2-469b-9142-825062a18ced', '84a5e354-25f2-4b2d-b56c-12fa33c19d86', '114342a0-333b-4ddc-a403-81fa9e632de9', '2746a62c-e0ac-40e2-a840-5587149d8c57', '0e5a60a4-d10f-47cc-bbd4-375468593069']","['make-mips-interpreter__UEsFcje', 'make-mips-interpreter__cJMpVsb', 
'make-mips-interpreter__2awsH4y', 'make-mips-interpreter__mrVPn5A', 'make-mips-interpreter__hDjhBBp']",0,"[1843.855607, 1807.752178, 1840.534871, 1800.515873, 2108.757868]","[84.687288, 70.733264, 252.133798, 55.151528, 10.886827]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,merge-diff-arc-agi-task,5,"['1162e9e5-e3f3-4df8-a004-08c575d8b652', '8193060e-51ff-46e6-8e53-128f96fb32e3', '1e6ede1b-47b4-4d13-b977-ed246071e37a', 'b45fa4aa-8565-452f-ad00-4bdebde0cc0c', '58fa34e5-e5c1-4e85-ba33-a19c5fb072e7']","['merge-diff-arc-agi-task__QoDk9E2', 'merge-diff-arc-agi-task__tVE7YCf', 'merge-diff-arc-agi-task__GyGpMtA', 'merge-diff-arc-agi-task__X4bL7yf', 'merge-diff-arc-agi-task__8thg4vm']",0,"[904.728393, 900.884919, 889.530768, 382.938725, 907.826836]","[13.74974, 133.039146, 84.601202, 18.978391, 72.089727]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,model-extraction-relu-logits,5,"['83013d73-49df-4065-9bd3-3ffc1642e4dd', 'd7cde291-3d23-438e-ad31-2c51625e1123', '4c85aaad-6263-45ed-afdc-0df292c4a327', '2aa8a679-658b-481a-b262-42fdea09d8ed', '14bc30db-4bbd-4924-81ab-aff2e6a28629']","['model-extraction-relu-logits__iFwpNgN', 'model-extraction-relu-logits__Ec9hRzj', 'model-extraction-relu-logits__3KzucZP', 'model-extraction-relu-logits__Ji5PDVA', 'model-extraction-relu-logits__ydqfqZr']",2,"[529.043405, 843.14087, 459.288541, 486.902523, 493.51599]","[162.958041, 116.933612, 12.586843, 42.826211, 47.65661]",0.4,False,"['d7cde291-3d23-438e-ad31-2c51625e1123', '4c85aaad-6263-45ed-afdc-0df292c4a327']" +moonshotai/Kimi-K2-Instruct-0905,mteb-leaderboard,5,"['eca79125-88db-4820-a3e2-af90f96ae8d8', '18116941-f772-4f0e-8423-902d4c1c3d5b', '59a52a27-3faa-4c34-a0d1-4c318ec36dee', '607d1c62-afed-4ec5-83a5-958125d43a67', 'dda1c072-c77e-4d2a-acfa-24412c369a3f']","['mteb-leaderboard__VC269nf', 'mteb-leaderboard__F5udNsx', 'mteb-leaderboard__Xk9Eg6K', 'mteb-leaderboard__ejPSMXZ', 'mteb-leaderboard__5EgkqRP']",0,"[1342.634596, 310.186324, 2753.225711, 545.52535, 
506.521827]","[54.192646, 6.042063, 4.294825, 2.346824, 3.795955]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,mteb-retrieve,5,"['5d46de94-8c27-43d6-933f-6d8adb739eef', '3b7e8481-8328-4487-a89b-81bd84ddb83a', 'f13817ec-b542-4da4-9c29-8eafe1352efe', '7e2eb257-28ac-49eb-9c18-24b2c50a5d36', '814946c3-3467-4ef8-ad1f-01a8603a594f']","['mteb-retrieve__F4V7b2y', 'mteb-retrieve__6oMmCyG', 'mteb-retrieve__9WTu54m', 'mteb-retrieve__xBffsfM', 'mteb-retrieve__LehbmHD']",0,"[436.124129, 375.925406, 247.564662, 556.153563, 254.468697]","[13.068214, 31.615802, 122.799079, 42.736558, 101.904606]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,nginx-request-logging,5,"['74a4f208-3c27-4f27-96bb-52c44f81778c', '2a7142e7-095e-4520-9798-3270a5c7f9a7', '1aae83f7-f423-4910-93f9-bbc66cb8a7dd', '5e803188-7216-4015-aab7-d930a2814045', '5c754e1c-5656-4539-9798-affc4df166b6']","['nginx-request-logging__T2pZve3', 'nginx-request-logging__7HjppiS', 'nginx-request-logging__Z7MzKEC', 'nginx-request-logging__LNaTg62', 'nginx-request-logging__RNKEuhd']",2,"[487.801388, 467.707808, 928.656158, 447.375746, 624.23191]","[14.965855, 57.97568, 80.270653, 16.145467, 110.400744]",0.4,False,"['1aae83f7-f423-4910-93f9-bbc66cb8a7dd', '5e803188-7216-4015-aab7-d930a2814045']" +moonshotai/Kimi-K2-Instruct-0905,openssl-selfsigned-cert,5,"['9d63fab6-6b80-436d-b21b-93131dc19855', 'b48e2287-c476-4880-84df-705e261f2f9c', '30aa52df-108a-41fe-9a83-b1e68ea63abb', 'b3efe4dd-ce98-4a5b-a1cd-95714af47bec', '818a5974-2f0a-49e3-8f58-dec181eed745']","['openssl-selfsigned-cert__WtsrjP6', 'openssl-selfsigned-cert__HDqHCVw', 'openssl-selfsigned-cert__WgHuRPf', 'openssl-selfsigned-cert__JwURZgk', 'openssl-selfsigned-cert__Foue9tK']",3,"[218.3977, 267.589208, 225.513232, 633.796514, 736.863069]","[27.597468, 17.464117, 15.936333, 66.397256, 53.972311]",0.6,True,"['b48e2287-c476-4880-84df-705e261f2f9c', 'b3efe4dd-ce98-4a5b-a1cd-95714af47bec', '818a5974-2f0a-49e3-8f58-dec181eed745']" 
+moonshotai/Kimi-K2-Instruct-0905,password-recovery,5,"['a9f5326c-69dc-4656-bd6e-cd11e2bc15f1', 'be9428a0-e800-47f4-8348-58c56cf3cd8a', '5ed3a276-5b7a-477a-88eb-07a907130ad1', '030c60e1-980a-414e-9370-01d3a19ec68a', '3634371f-5cfa-4c2e-aa9d-dfa0dec47a6b']","['password-recovery__Cx3vAr4', 'password-recovery__Nxi6yYs', 'password-recovery__TTZGZnn', 'password-recovery__4YvDLD3', 'password-recovery__U7byCyR']",1,"[575.619497, 913.523787, 752.412577, 913.513438, 900.211672]","[47.689653, 49.871564, 27.112056, 26.280146, 50.385627]",0.2,False,['a9f5326c-69dc-4656-bd6e-cd11e2bc15f1'] +moonshotai/Kimi-K2-Instruct-0905,path-tracing,5,"['1a3cec9b-b4a1-45e8-b8b6-6d957408a37a', '022aa524-d479-4a4d-b240-8b59085c88c0', '732b8070-0731-495f-9fce-82a99731db16', '40c0d6f8-4c58-45b2-87be-9a12e33f64f6', '0d745d79-1273-4963-820f-c40cec623d83']","['path-tracing__56QszhW', 'path-tracing__5SKqjzi', 'path-tracing__BdySXv6', 'path-tracing__ZY2jywE', 'path-tracing__BUfjRq7']",0,"[840.989617, 1820.851112, 1181.13938, 1101.284906, 2035.562264]","[38.145281, 30.109456, 27.48038, 26.867637, 259.055995]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,path-tracing-reverse,5,"['37a74b29-e7a4-400b-a188-aace78c0d409', 'c7c2e000-4711-495b-bfab-7d5305a3acc1', 'a8fbac2b-d36d-4234-bb76-195f2a2d49e4', '562ac434-8192-4567-ba00-414ee15d82b0', '5e7a9f58-deb8-4eee-bae4-40de303db202']","['path-tracing-reverse__uxH7Yv5', 'path-tracing-reverse__jBHvmMz', 'path-tracing-reverse__yrqE7w5', 'path-tracing-reverse__Y63n8Ji', 'path-tracing-reverse__vg3pXFQ']",0,"[588.36258, 2057.761833, 1264.466779, 737.642621, 1006.381626]","[49.577812, 26.07529, 33.004095, 34.360416, 41.535989]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,polyglot-c-py,5,"['acb1d3a5-023a-45da-90a6-3f0d90adf5cf', '7f6f52d4-ea16-4dda-a939-e97125f3c238', '2adabc36-17a7-42b8-903f-ca3a71fd34bf', 'bb850552-9147-4269-9a7f-0edb85891dee', '8da93d19-ff0e-480f-8438-88ce64b88edc']","['polyglot-c-py__4K5WAoK', 'polyglot-c-py__Gavigdj', 
'polyglot-c-py__rLXGyfv', 'polyglot-c-py__efdTZtb', 'polyglot-c-py__6GdGFpG']",0,"[901.780684, 900.018897, 904.145887, 1009.323618, 632.136773]","[14.185105, 56.425574, 29.495695, 49.580035, 59.203777]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,polyglot-rust-c,5,"['0f834879-7a7c-4a93-b58d-a0151c8db4b3', '31d7385d-7080-46cc-a45d-b40493ab9aca', 'b8945bb2-965f-41c1-a835-4b2f25e4a9c8', '3ac442dd-ac18-4e95-9193-ff66942a9ddd', '989da270-4ef2-47f7-9154-9bf999730fdc']","['polyglot-rust-c__7oqX2Sq', 'polyglot-rust-c__QqdJq4o', 'polyglot-rust-c__cSiRrb7', 'polyglot-rust-c__uzQWVQk', 'polyglot-rust-c__kwVg35E']",0,"[928.712501, 921.516485, 900.006148, 903.750118, 909.688541]","[25.172921, 94.239753, 59.891946, 284.609103, 111.670921]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,port-compressor,8,"['70fe8fa7-e0a5-4062-aa04-419e348b19a3', 'ca4e8210-a4ff-40b8-afbd-5516276e3eee', 'ed42c328-f2f6-4c65-b5ca-c0a47bc9ad4d', '06db5486-4be0-4420-a5dd-06196167f155', '7ed960d8-2fa5-4dda-9db8-a167419401f4', 'd83f9dd9-f8c1-439b-84b7-01b10a3d864d', '94a160a6-b1b5-4717-8d02-3f16d21a5349', '7689d110-ab4a-4164-b225-86b4fc18c7e0']","['port-compressor__fepyt3m', 'port-compressor__AShTiNT', 'port-compressor__nEQ8Z89', 'port-compressor__uGzhkrd', 'port-compressor__pZD68qz', 'port-compressor__L5JsZ2T', 'port-compressor__KotdGaS', 'port-compressor__tLGj5Db']",0,"[2081.210711, 1299.824652, 3601.387825, 3618.151075, 3600.513314, 3600.001018, 1473.23885, 3587.103511]","[10.546171, 9.046541, 182.025789, 18.555874, 70.819555, 60.916678, 12.498026, 42.537143]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,prove-plus-comm,5,"['86a8c7a3-349a-4c60-b6b8-b52d6632fb14', 'fa031b00-8bc5-42f2-af84-2cdd01663a9a', 'c84ff7ef-2609-476d-8adc-61c58e43c6b4', 'df6e5ff7-6b56-4ecf-8e7c-f9fd7f5b4dea', '6dbde439-fda8-4773-8da3-e6ac16d5e25d']","['prove-plus-comm__QpB3gdj', 'prove-plus-comm__ajZRVhr', 'prove-plus-comm__TbV85oV', 'prove-plus-comm__YMHzrJC', 'prove-plus-comm__uXJJuXT']",4,"[89.970492, 394.415537, 
901.598533, 152.285369, 684.233345]","[14.533511, 41.801986, 84.200583, 58.805654, 67.179931]",0.8,True,"['86a8c7a3-349a-4c60-b6b8-b52d6632fb14', 'fa031b00-8bc5-42f2-af84-2cdd01663a9a', 'df6e5ff7-6b56-4ecf-8e7c-f9fd7f5b4dea', '6dbde439-fda8-4773-8da3-e6ac16d5e25d']" +moonshotai/Kimi-K2-Instruct-0905,pypi-server,5,"['0ae49add-4c2e-4767-ad43-36288de6dda9', '1a96515e-cd03-4409-b6c9-f5529def8d50', '595d1939-2424-4366-bd42-beedd35b8b32', '961d6353-b25e-411f-b7a5-a4df1af2ffaa', 'a676c26e-9136-409d-90ad-eed7566362db']","['pypi-server__NXXXAj2', 'pypi-server__UJWQgpR', 'pypi-server__SXYm6Fj', 'pypi-server__fepkj7H', 'pypi-server__bCK2jU8']",1,"[910.536401, 667.874785, 793.433323, 249.04196, 761.406198]","[43.29378, 35.510825, 43.087308, 52.039426, 14.300251]",0.2,False,['595d1939-2424-4366-bd42-beedd35b8b32'] +moonshotai/Kimi-K2-Instruct-0905,pytorch-model-cli,5,"['9a73c9f9-f9a9-4663-bb81-f19141d6e5c1', '7a808293-9462-4801-a4c1-6f289c5ac9c2', '59c802b1-0442-4c9e-80d7-6a433ca26c60', '7c0bb66a-fee2-44a9-a795-ce9b141e0eab', 'ab82794a-3124-4596-bd81-d6fa1747519a']","['pytorch-model-cli__DaXSBhN', 'pytorch-model-cli__vaxmQeT', 'pytorch-model-cli__gXAWCHb', 'pytorch-model-cli__PvQ3Y3e', 'pytorch-model-cli__Zdekgjv']",0,"[411.493578, 650.269341, 384.687979, 941.911409, 839.393672]","[134.027991, 61.030558, 46.579003, 35.090026, 33.728231]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,pytorch-model-recovery,5,"['81369027-9010-458b-af5b-d5ac49bcb60d', '6004a4b8-5eec-43eb-b873-52da8fd9381a', 'aca9a3cf-9a3f-4780-88e8-ed725137a1ec', 'd564e1c7-5dd3-47f3-8f3f-040ebdf8350d', '5334ce1c-e444-440d-91b1-dad213c1a1f9']","['pytorch-model-recovery__p4iFrEJ', 'pytorch-model-recovery__4aU3drg', 'pytorch-model-recovery__gU8Desc', 'pytorch-model-recovery__cCbDjpM', 'pytorch-model-recovery__YSDMa6N']",2,"[912.948684, 900.051785, 750.217438, 901.315843, 914.338319]","[62.327445, 37.682139, 43.354051, 73.94469, 11.865706]",0.4,False,"['81369027-9010-458b-af5b-d5ac49bcb60d', 
'aca9a3cf-9a3f-4780-88e8-ed725137a1ec']" +moonshotai/Kimi-K2-Instruct-0905,qemu-alpine-ssh,5,"['dbeaa5ee-5fbf-4e66-aab3-219ad58bfe1e', '71183fc6-dbc9-46fb-8701-f0cc89b75a0e', '71b22a5b-0aca-4179-b08d-e6f251152f28', '665dc520-f100-4932-b763-60cd5f16ef59', 'b6431da8-b59c-4ca3-8628-25ea57598183']","['qemu-alpine-ssh__AVBpza7', 'qemu-alpine-ssh__NzkF35n', 'qemu-alpine-ssh__6ZasmbC', 'qemu-alpine-ssh__Qd8pXyZ', 'qemu-alpine-ssh__ehYtwTi']",0,"[903.037901, 900.26263, 238.972082, 1044.974533, 904.611802]","[41.353781, 4.620959, 4.969112, 4.366165, 27.876339]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,qemu-startup,5,"['2e1d3012-18d7-4b49-93c9-b35f1ffe3518', '737b8cc3-5e2e-468a-a50d-a22ee642b7fc', 'a32654a9-5819-4eeb-bc8e-c5ab09e6281a', '13b4dd5d-b1f8-4e05-9fb3-6163378efb24', '4bc89ec1-a3be-490a-81e7-69826af76afe']","['qemu-startup__kRtt6T4', 'qemu-startup__5TAboYM', 'qemu-startup__b8KAgez', 'qemu-startup__yxQME3W', 'qemu-startup__jYFxjtZ']",2,"[1012.517922, 146.083293, 344.061338, 224.649714, 937.207314]","[6.421041, 18.7972, 10.630923, 4.615391, 9.34078]",0.4,False,"['737b8cc3-5e2e-468a-a50d-a22ee642b7fc', '4bc89ec1-a3be-490a-81e7-69826af76afe']" +moonshotai/Kimi-K2-Instruct-0905,regex-log,5,"['70ad6e7e-f0bc-4bc8-9645-13f49bb4aed2', '415e363c-8a81-4ce3-98a9-52cd0be7d093', '1356f66c-3dd3-4172-a61e-bed038adb22f', '0c694af2-29c8-46f1-8ce4-744ece309e29', 'dac4d51e-b35e-4398-99e6-6633dde32d0e']","['regex-log__fapHPyq', 'regex-log__Exo6Q8D', 'regex-log__E5vd62J', 'regex-log__MFbi8mg', 'regex-log__sfCTDfP']",2,"[845.755794, 272.557405, 674.1976, 375.161949, 303.677945]","[114.314306, 133.295517, 166.094069, 190.611473, 77.45902]",0.4,False,"['70ad6e7e-f0bc-4bc8-9645-13f49bb4aed2', '0c694af2-29c8-46f1-8ce4-744ece309e29']" +moonshotai/Kimi-K2-Instruct-0905,reshard-c4-data,5,"['51ea6191-fce2-412a-97c5-eeaefe0c14aa', '1db09e50-1b46-4805-89d6-334e42b3459e', '7713e6c5-4b75-44d0-8ea9-eb813fb08e53', '0918ce2f-0772-4f77-95d3-0bc08cc319d1', 
'e251ab03-2b20-48d3-8c5f-8ca18e6de1a8']","['reshard-c4-data__He5qbkh', 'reshard-c4-data__s8nUfuY', 'reshard-c4-data__ikhQ3eE', 'reshard-c4-data__MQ7UUMA', 'reshard-c4-data__rDZEZ5u']",0,"[518.070317, 717.6119, 403.226755, 1786.932415, 448.617127]","[66.376353, 214.681234, 19.777865, 44.047193, 97.990832]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,reverse-engineering,5,"['7a49235b-1b2f-484d-921b-9ea63dab8d0f', '438fdb9a-f5fd-4e7a-937d-0dddb51d9a7f', 'd867c87b-0ff2-457c-8f8e-abf34cd9e4a7', '33f71961-78c3-4225-a260-731a037cb298', 'ba0b2cd9-beb9-4194-bd78-8d28ceba0bcc']","['reverse-engineering__wgXcWn4', 'reverse-engineering__83yVyU7', 'reverse-engineering__MBXGhWn', 'reverse-engineering__KewZSoL', 'reverse-engineering__PTWe2Z6']",1,"[328.351121, 2550.101008, 1801.947719, 1811.558149, 1800.048259]","[47.707888, 27.808088, 16.635542, 46.62762, 37.46004]",0.2,False,['7a49235b-1b2f-484d-921b-9ea63dab8d0f'] +moonshotai/Kimi-K2-Instruct-0905,run-pdp11-code,5,"['127905a6-5f28-4f57-b60c-99a8363c42f5', '00090459-c21f-452f-a6e4-d5d5847522e8', '91c244c5-c83d-4a36-b897-31b0236caa8a', '9214016a-12d3-47ad-903a-53708eea5210', '4a33b7a6-70b5-42b3-a6d7-226993fdae2a']","['run-pdp11-code__6aDCJQF', 'run-pdp11-code__mk59JEN', 'run-pdp11-code__Gy6Pmw2', 'run-pdp11-code__cnM45gD', 'run-pdp11-code__Fhmj7LE']",0,"[1004.523248, 681.128358, 1001.317613, 1006.292308, 1000.030553]","[131.992211, 21.056462, 162.296984, 68.966569, 65.564929]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,sanitize-git-repo,5,"['7719f772-f6ea-4bc5-b035-970d7c57a200', '115fe85d-e11d-4e77-8ee0-bcf687ab1799', '2c08e10c-8327-4666-999f-d81220e36c00', 'ee1c65b2-caaf-4e4d-81bd-bb2e7cba0ca4', 'bef2dad9-a5a6-462e-a0cc-7fc252b2d3cf']","['sanitize-git-repo__g92CDLJ', 'sanitize-git-repo__ckk8ZFt', 'sanitize-git-repo__rv5C4aA', 'sanitize-git-repo__EXBWo2n', 'sanitize-git-repo__Ujjz22t']",0,"[602.871666, 656.610933, 410.238054, 1005.461702, 705.372478]","[37.663743, 53.530868, 330.057722, 289.9723, 14.437377]",0.0,False,[] 
+moonshotai/Kimi-K2-Instruct-0905,schemelike-metacircular-eval,5,"['967cf96f-8ea3-4075-86f3-3fbf3594e5c7', '7f6f3ec3-d1e6-4cc1-a252-4204d75ebba1', '382de16c-b539-434b-83c0-a43a4e354b0b', 'a9856963-833a-419b-8668-85e9e45c1175', '17f63c08-b13d-4c5e-86c3-17aad69f9fa1']","['schemelike-metacircular-eval__DG6jChG', 'schemelike-metacircular-eval__PWdrpNs', 'schemelike-metacircular-eval__b7fN9aW', 'schemelike-metacircular-eval__qK9EDGb', 'schemelike-metacircular-eval__vhW5brq']",0,"[2410.727038, 1933.0568, 2435.919489, 2406.577526, 1486.135572]","[40.377176, 31.397021, 87.554736, 25.788846, 31.996926]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,sparql-university,5,"['76908251-b3f3-45e1-89a9-ab9016be7d87', '04ab7c9f-ce5c-46d2-a7da-d512fd63f9ca', 'f43ee00a-b8bd-4ea9-b25a-8fb9de2d7838', '777bf74f-c7e0-4a8d-8dc2-98ab0a5eb4e2', '93fc19f0-eb37-45e7-8f75-9dd3ee395ad5']","['sparql-university__6aCvU94', 'sparql-university__DsprTBW', 'sparql-university__JdgtKSG', 'sparql-university__4aeFNZg', 'sparql-university__9ugwCT2']",0,"[316.709093, 413.753981, 906.094128, 387.139545, 244.127457]","[37.967754, 16.522715, 350.593862, 50.429224, 58.480521]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,sqlite-db-truncate,5,"['11694e05-dd39-4133-90d4-44b0a3c2c831', '732dab7e-bf5d-48cb-a0f7-724c75bed214', 'dae4de34-7533-4679-a3ac-ffe6810d6ec6', '2c0bcaaa-4797-40c9-81ec-13da7993c33b', '03fb3fff-1f8b-4416-bcbc-44a7974cd67f']","['sqlite-db-truncate__3tq7S2Q', 'sqlite-db-truncate__SCTYNoT', 'sqlite-db-truncate__C97ibRW', 'sqlite-db-truncate__LQSppS2', 'sqlite-db-truncate__nwDz3a7']",0,"[696.839561, 900.048903, 394.126657, 276.167985, 638.45709]","[19.760045, 104.242514, 13.877192, 14.646549, 65.0506]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,sqlite-with-gcov,5,"['725182bf-d40c-4369-a573-d75b4e0e0005', '7aa15593-8d6e-426f-9295-1df9030a9729', 'a3af84d2-1ed8-4293-94ec-a59f23bda1f4', 'ceabc53b-4446-46d0-a5cf-6fe825f4990c', '4bc91b62-ce6a-4b2a-bb71-618424aa2c6c']","['sqlite-with-gcov__6Nx7GMY', 
'sqlite-with-gcov__fWhazP5', 'sqlite-with-gcov__oouv6B8', 'sqlite-with-gcov__Q2srsFE', 'sqlite-with-gcov__ewNCPRe']",2,"[313.2702, 324.311196, 912.912405, 720.762943, 442.039122]","[13.832342, 46.723814, 67.181268, 95.132258, 31.776968]",0.4,False,"['ceabc53b-4446-46d0-a5cf-6fe825f4990c', '4bc91b62-ce6a-4b2a-bb71-618424aa2c6c']" +moonshotai/Kimi-K2-Instruct-0905,torch-tensor-parallelism,5,"['9989cbee-0411-4a8c-9f62-b919f07eeb0c', '86698a4e-39a5-4a74-91e1-87c1108d267f', 'b219161c-e366-446b-ae52-94a004ee464c', '18bffdab-4965-4fe7-90c1-bdfd01a67e02', '25cf14f0-7784-4aed-afdb-74274ce42929']","['torch-tensor-parallelism__TyAUZxw', 'torch-tensor-parallelism__Jc66Kdq', 'torch-tensor-parallelism__hEMJiPA', 'torch-tensor-parallelism__QW9fiky', 'torch-tensor-parallelism__mvvLFMX']",0,"[633.499363, 548.275601, 93.879562, 418.578883, 900.025716]","[40.6683, 23.565098, 24.747833, 102.032287, 22.452074]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,train-fasttext,5,"['3e3d44f8-ba48-4e70-b3d3-5f3a41ba121b', '0d167cd0-381d-4a6d-a377-91cbfb270860', 'd41b4881-05a7-4148-8d96-3f044bcce710', '61f28ccf-a7d3-4674-8fc3-c36c15b39e8f', '4b489bc8-c291-4280-87fe-f3e78f744c15']","['train-fasttext__yDmMAi4', 'train-fasttext__CmTQdUu', 'train-fasttext__uQzZCaU', 'train-fasttext__agLNZ2Z', 'train-fasttext__f5kL9qA']",1,"[3295.174305, 3606.317587, 1825.768686, 3198.453359, 3600.8256]","[52.893708, 77.545165, 20.54045, 12.508541, 136.035933]",0.2,False,['61f28ccf-a7d3-4674-8fc3-c36c15b39e8f'] +moonshotai/Kimi-K2-Instruct-0905,tune-mjcf,5,"['551d0d50-197f-4fe0-845c-7b48626119b1', 'c1b78f68-50ac-470a-82f1-468534ae49bd', 'aa86d76f-f732-4af2-b931-56fa8c29cbff', 'c183ee83-708e-428f-8b5e-b337a716dd1c', 'c6954ee1-ecc1-4470-9021-de12d1b58e50']","['tune-mjcf__9nNVEgp', 'tune-mjcf__VoHREcE', 'tune-mjcf__qiwtBPY', 'tune-mjcf__NJQni9i', 'tune-mjcf__n2cRgFU']",2,"[589.374911, 904.245024, 935.342423, 900.378612, 657.776508]","[21.014378, 13.974142, 84.345257, 8.592492, 
47.073251]",0.4,False,"['551d0d50-197f-4fe0-845c-7b48626119b1', 'c6954ee1-ecc1-4470-9021-de12d1b58e50']" +moonshotai/Kimi-K2-Instruct-0905,video-processing,5,"['e0e6f36a-23fc-42b4-9179-df396a846625', 'f4e0a6c6-7226-4bfd-87e9-0ea53c38e392', '0ebc1507-08c2-4aa6-a7c6-a413218cf892', '1ebe098c-b6ab-4abd-bcc1-6963cb5f3af5', '163ae01a-b148-4b4b-ace9-20b989abf67d']","['video-processing__5B3xwbW', 'video-processing__UYovbPk', 'video-processing__EaGjStr', 'video-processing__dPSJfTq', 'video-processing__bP7MXtP']",0,"[249.703665, 499.243593, 499.261372, 388.241618, 256.62703]","[50.315684, 134.457188, 143.343109, 32.943867, 86.46742]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,vulnerable-secret,5,"['a30b4630-c39e-4ad7-91a9-29e0810e4b08', 'c61f5f26-8447-4932-9d30-640e19eaf9a3', 'e859f139-86f3-46f2-bfee-c76d9a4af199', '938c8306-ea85-4b48-9a8f-13ffd6299616', '25216d68-52ae-47fb-a886-27d89e4bd382']","['vulnerable-secret__Hr8saMZ', 'vulnerable-secret__fxzi7JL', 'vulnerable-secret__ygHyA6d', 'vulnerable-secret__ZDh3Rqz', 'vulnerable-secret__SS6KWsH']",1,"[907.945944, 910.738663, 904.522982, 904.684933, 719.419793]","[76.22678, 14.011213, 12.843862, 13.086458, 10.111499]",0.2,False,['25216d68-52ae-47fb-a886-27d89e4bd382'] +moonshotai/Kimi-K2-Instruct-0905,wasm-pipeline,5,"['fa2f8c5e-cec5-45e3-9e45-890fb2452cbc', '62d25046-bf12-4cb2-ac5a-c60d60d648a0', '62195ec7-b3ea-4f19-828d-8fcc0b60bc6d', '2f0c5bb1-82c1-4057-a4bb-af22f7e5b3fd', 'd6a7e673-c414-46a1-b2bd-65f3bdeb5a25']","['wasm-pipeline__nahE5qQ', 'wasm-pipeline__Poqfupa', 'wasm-pipeline__qTdWq49', 'wasm-pipeline__K76TpCo', 'wasm-pipeline__J8thWXR']",1,"[946.478056, 916.817123, 357.450057, 634.842622, 829.864205]","[63.190852, 14.560507, 21.246859, 12.118952, 19.006295]",0.2,False,['d6a7e673-c414-46a1-b2bd-65f3bdeb5a25'] +moonshotai/Kimi-K2-Instruct-0905,winning-avg-corewars,5,"['fc133464-aad8-47d1-a846-b7b52278b7f7', '7c09e20f-6bf7-482b-89a5-23a9d356d053', '23c6deb2-a46c-4d51-bf96-d226c14c5a80', 
'9384f5b8-214c-427b-990b-de9cfce76bdb', 'de079411-a6b5-4929-ab67-eb1cd8cf93b7']","['winning-avg-corewars__ArrkGW6', 'winning-avg-corewars__dEbhSSH', 'winning-avg-corewars__juyuY2c', 'winning-avg-corewars__koQiUXq', 'winning-avg-corewars__HX6czyX']",0,"[2741.376983, 1136.614409, 2585.892994, 836.514908, 2882.272548]","[8.61334, 29.284359, 54.701238, 9.246336, 84.303928]",0.0,False,[] +moonshotai/Kimi-K2-Instruct-0905,write-compressor,5,"['d6c8edd1-e031-41ed-b4bf-7b808e8ad427', '57e04059-2ca8-488a-b431-77f66ff880e9', '270204a5-fa6b-42a4-b9cf-cd7843a286fa', '189c55ce-6e82-4ee6-bd1e-0e4e43e39794', 'f498dc16-86fc-4746-a99f-066aa5c8f3d7']","['write-compressor__TiYvzeZ', 'write-compressor__cqM6o6p', 'write-compressor__FTj97Cy', 'write-compressor__mhMQRJC', 'write-compressor__iMgzYxy']",0,"[939.934948, 782.580816, 900.032755, 900.378559, 902.347031]","[123.067264, 22.184398, 21.84505, 82.909814, 25.333353]",0.0,False,[] +openai/gpt-oss-120b,adaptive-rejection-sampler,5,"['faeeb025-41d2-4ea6-8445-0fe223b4bc41', '064cef09-19de-46a2-bc45-6e9f67524e7f', '840a0d3b-6647-4c8f-a6e8-148678c1c146', '142c88ab-1bfc-4243-8a50-441a4e82567d', 'b9cd2030-c82f-4307-bd16-b87826698f91']","['adaptive-rejection-sampler__F8Pth9A', 'adaptive-rejection-sampler__BqwK2Ys', 'adaptive-rejection-sampler__kiwqcm7', 'adaptive-rejection-sampler__Bk5w6LX', 'adaptive-rejection-sampler__Tpa3XnE']",0,"[530.766233, 217.827978, 902.183438, 701.928281, 455.291343]","[87.982821, 138.768842, 67.810637, 58.28808, 87.024815]",0.0,False,[] +openai/gpt-oss-120b,bn-fit-modify,5,"['aa1572f4-169c-4092-912b-52f3d2f28782', '4c465ca1-4bcf-417b-b1ba-fd2a19241a3c', '6ba6f338-43c3-4f33-918e-267177f98468', '5a08ef44-1b42-44b2-9afd-3898bf4773a0', '518167f4-76d1-447b-b58f-cd76602fcfbb']","['bn-fit-modify__z8XL9pD', 'bn-fit-modify__6hdAj9g', 'bn-fit-modify__kprWpc2', 'bn-fit-modify__sHTNePC', 'bn-fit-modify__akUffjg']",1,"[274.847726, 388.341266, 1834.933602, 208.541532, 194.462602]","[148.959492, 73.845021, 154.331114, 41.910584, 
197.912018]",0.2,False,['4c465ca1-4bcf-417b-b1ba-fd2a19241a3c'] +openai/gpt-oss-120b,break-filter-js-from-html,5,"['85eed476-988c-4c70-a41c-be830e1dcdc3', '3362673f-f8a4-4b81-aacd-c073df21690d', '5774efab-97fd-4112-999f-d57b3591a08e', '3081e06c-eebf-4d7c-857a-8dff22e4b6ab', '117e281a-7f97-4c9a-bd8c-575d07d72161']","['break-filter-js-from-html__VGiR8EQ', 'break-filter-js-from-html__auiwbam', 'break-filter-js-from-html__MoG5eN8', 'break-filter-js-from-html__k37AwEm', 'break-filter-js-from-html__7deskAU']",0,"[1254.780368, 355.495715, 1208.666921, 72.120748, 115.633334]","[116.182021, 7.467026, 52.163213, 50.833337, 55.59159]",0.0,False,[] +openai/gpt-oss-120b,build-cython-ext,5,"['bf5def0b-35e3-43a1-abac-f8cbd1f16d5d', 'd9eca115-e0c3-463d-98b2-a9dc24bf7b3f', 'a4ba2774-dfd3-4fd5-bfe7-9dff16d353ed', '963bc5ef-b5f7-4b98-83fc-c806208a1972', '35cf8209-eb58-483f-8dd5-c34a435cfeb0']","['build-cython-ext__pjpeMUo', 'build-cython-ext__5jncGjF', 'build-cython-ext__SqxXKmb', 'build-cython-ext__EcCAY2E', 'build-cython-ext__9A72uvd']",0,"[912.055555, 900.472911, 900.540037, 902.247733, 900.36206]","[37.360216, 74.394331, 14.83845, 237.707213, 195.75203]",0.0,False,[] +openai/gpt-oss-120b,build-initramfs-qemu,5,"['22caa237-7018-49d7-99a9-439d403fa56b', '126658b8-b075-40a4-b379-221579a64bcc', 'b709b08b-42aa-4bbe-b473-a201174d501b', 'a8a7114f-cac2-477b-9042-4012a0240cbc', 'a53dc8c4-095f-417a-9cc0-01167b96fe1d']","['build-initramfs-qemu__zzekKs2', 'build-initramfs-qemu__szqrxUt', 'build-initramfs-qemu__3QYbeu4', 'build-initramfs-qemu__fbotyH4', 'build-initramfs-qemu__Nk5gPsd']",0,"[136.322567, 303.618472, 187.639593, 916.297652, 192.336938]","[56.634104, 10.597856, 91.300855, 27.163713, 251.151549]",0.0,False,[] +openai/gpt-oss-120b,build-pmars,5,"['537ace88-a5c4-473b-a497-625221d892f1', '0b5bdcac-a289-43e1-a0c2-d67b6c50d789', '03860372-7808-4d99-8ea7-f58621da134b', '5ebb5a6a-3316-4c6a-9f26-2a3bbdab6408', 'cc99d103-67e7-4e3d-97d9-5d9b31b0f706']","['build-pmars__FeYDePv', 
'build-pmars__gh9M6ER', 'build-pmars__sDayypm', 'build-pmars__GQR9KE2', 'build-pmars__zmCaxzt']",1,"[900.935693, 915.518592, 775.80269, 900.501102, 904.576425]","[12.945904, 71.009048, 3.338607, 4.910237, 36.127234]",0.2,False,['03860372-7808-4d99-8ea7-f58621da134b'] +openai/gpt-oss-120b,build-pov-ray,5,"['663f4f86-68cb-44d8-8093-5994321c1fb5', 'fa493922-de8b-413e-a8d0-ea4719ae7a60', '96d2fadb-b05e-4893-a004-f23de8259aa4', '59d9d525-de3e-46c8-9ac2-620e9c62bccc', 'aa59ad01-e2ee-4f80-aa45-0d725fa8a7e5']","['build-pov-ray__asMmMue', 'build-pov-ray__tDEE7ki', 'build-pov-ray__M2XvLcV', 'build-pov-ray__57FDSev', 'build-pov-ray__W8DCCsu']",0,"[1171.269573, 4434.340658, 5515.988431, 6000.725107, 1982.660405]","[32.025248, 52.930933, 46.144922, 31.167965, 17.639901]",0.0,False,[] +openai/gpt-oss-120b,cancel-async-tasks,5,"['c7a18052-035d-419f-83df-cee2a0f02b56', '225291d5-e73d-4a74-9d07-962b43a3bb10', 'e8ce1179-b3e5-406a-9e28-675bfe510eb0', 'e467dd30-9015-4936-98a1-34023bc288b5', 'b95e474b-cf55-46d9-a8e2-c858dd3424b6']","['cancel-async-tasks__MSJfokf', 'cancel-async-tasks__qkek47q', 'cancel-async-tasks__MdUD6Wa', 'cancel-async-tasks__QSyuAyr', 'cancel-async-tasks__mWMjQiU']",3,"[80.955706, 24.594396, 84.453769, 61.728873, 50.402216]","[94.669266, 48.520103, 134.447342, 34.856036, 57.67464]",0.6,True,"['225291d5-e73d-4a74-9d07-962b43a3bb10', 'e8ce1179-b3e5-406a-9e28-675bfe510eb0', 'e467dd30-9015-4936-98a1-34023bc288b5']" +openai/gpt-oss-120b,chess-best-move,5,"['d65ab5f7-7c05-4002-9c09-4d7432cbfef8', '023e5e03-2195-4f15-8cfa-203b94caa5a0', '13dcf215-3eb1-4998-8420-73dd73409e84', '2da8398c-fb0c-4380-bf10-200891b839b1', 'f758b943-1fb6-47f0-8f1d-5a206c158839']","['chess-best-move__opYhbFU', 'chess-best-move__jUm6GSi', 'chess-best-move__EJ9drc3', 'chess-best-move__nutkSyC', 'chess-best-move__JzxyjjV']",0,"[332.801006, 416.918374, 524.814307, 805.521973, 902.75813]","[118.377106, 13.301788, 36.084309, 7.367226, 54.602217]",0.0,False,[] 
+openai/gpt-oss-120b,circuit-fibsqrt,5,"['cf605add-f801-44c7-824b-2e7de38ba337', '1dcdb912-1680-451e-a8e1-0eb3a19eb1a3', 'e46ffdbd-30d7-45ed-a7e5-491ff51e0dc5', '7bdac175-6fbd-4f65-924c-a5e6439c6c65', '65350c5b-6ca5-4310-b638-dfed4526d13b']","['circuit-fibsqrt__rMbFVbH', 'circuit-fibsqrt__S3yECSm', 'circuit-fibsqrt__SwCFa7G', 'circuit-fibsqrt__dj3u2wH', 'circuit-fibsqrt__uRqGcyh']",0,"[1155.87658, 3624.499176, 977.746549, 2855.665421, 706.457559]","[156.963412, 56.079608, 46.119424, 19.719806, 147.598855]",0.0,False,[] +openai/gpt-oss-120b,cobol-modernization,5,"['aa0a7438-d92e-4c60-b9ce-8cb13d7cfa0d', 'd58a333c-c74e-41d6-9062-21be85c74b1e', '08c2bd66-3b62-478d-9200-d64e4733a219', 'f7921767-d1dd-436e-babf-328a6c9fb99e', 'b8636d76-e8f3-4ae2-a6d0-f85726172856']","['cobol-modernization__CBxMeUK', 'cobol-modernization__LyX86qp', 'cobol-modernization__PhxjGyb', 'cobol-modernization__gLhJGta', 'cobol-modernization__3FWWGj5']",4,"[880.826442, 172.744965, 200.779358, 173.758361, 124.369042]","[120.294645, 51.789064, 45.868924, 52.813319, 68.104717]",0.8,True,"['aa0a7438-d92e-4c60-b9ce-8cb13d7cfa0d', 'd58a333c-c74e-41d6-9062-21be85c74b1e', '08c2bd66-3b62-478d-9200-d64e4733a219', 'b8636d76-e8f3-4ae2-a6d0-f85726172856']" +openai/gpt-oss-120b,code-from-image,5,"['702f9780-a0f8-465a-92ee-3bfac2848537', 'b6334679-32dd-436d-b06a-ac0d492406d9', 'e55a994f-114e-4324-8723-89dbf1dd0762', '1d481c69-4d91-4a84-8618-67724ddf70a7', '4f369f3f-2d33-40d5-9e31-ec17dabc3ae5']","['code-from-image__8aNQusA', 'code-from-image__L3gCbxf', 'code-from-image__UDSXbSi', 'code-from-image__gMKS246', 'code-from-image__t8a6qrH']",0,"[163.994538, 315.091059, 1220.886275, 175.473043, 741.887313]","[37.83932, 9.207699, 23.73477, 44.977702, 65.061674]",0.0,False,[] +openai/gpt-oss-120b,configure-git-webserver,5,"['3d16d4f1-087b-4562-9a9f-4b1bdf96aa73', '9b849f08-0957-4233-9d7c-a4f3dca594e9', '458cca10-69c2-4cc9-90af-b29853ae757a', '0952b483-f724-4859-954f-ee6ab4bfad53', 
'1114b076-eb58-463a-8d8e-ba0484ee3dbf']","['configure-git-webserver__B4c2pUZ', 'configure-git-webserver__2mifLgy', 'configure-git-webserver__ujpYz8T', 'configure-git-webserver__XviQNcN', 'configure-git-webserver__wvLwE3r']",3,"[209.571504, 379.191672, 168.864368, 295.40014, 568.77527]","[59.00492, 56.485986, 37.030413, 81.125707, 95.926653]",0.6,True,"['9b849f08-0957-4233-9d7c-a4f3dca594e9', '458cca10-69c2-4cc9-90af-b29853ae757a', '0952b483-f724-4859-954f-ee6ab4bfad53']" +openai/gpt-oss-120b,constraints-scheduling,5,"['11f477db-b168-4c19-96ae-5f8efc0f5313', 'a7273f7a-24a8-4067-9630-9aaa3e3afeff', '29eb6cff-0a4a-47bf-8ed8-535972a06a4c', 'eebee320-bc48-412e-9d6a-f3a116f7a014', 'feb1c748-359f-462e-ab64-21f015cd04a7']","['constraints-scheduling__jtH8m7g', 'constraints-scheduling__6XGgjrd', 'constraints-scheduling__UuwwW2R', 'constraints-scheduling__ko4E9CR', 'constraints-scheduling__9M5oxUy']",5,"[451.557666, 104.04398, 297.344998, 47.99831, 50.011653]","[52.72, 27.603674, 135.663548, 151.478515, 38.133512]",1.0,True,"['11f477db-b168-4c19-96ae-5f8efc0f5313', 'a7273f7a-24a8-4067-9630-9aaa3e3afeff', '29eb6cff-0a4a-47bf-8ed8-535972a06a4c', 'eebee320-bc48-412e-9d6a-f3a116f7a014', 'feb1c748-359f-462e-ab64-21f015cd04a7']" +openai/gpt-oss-120b,count-dataset-tokens,5,"['13869209-40bb-4e17-9b0a-7b90030c28c9', '7fe934b6-ce99-462a-a33e-48d88b051ad4', '146d3748-d33a-4eaf-a03c-be1b9a411226', '6c42b8b7-454e-49ce-a596-ee97d6e4f1a4', '55bfe684-05df-4cfd-b629-4a699cc0d931']","['count-dataset-tokens__PrYVpLa', 'count-dataset-tokens__zUa3Mhm', 'count-dataset-tokens__xYHWoMM', 'count-dataset-tokens__i32EYBz', 'count-dataset-tokens__YQRR7Uj']",0,"[243.517091, 428.644218, 386.720148, 173.911279, 189.466334]","[54.025886, 101.572249, 30.70396, 41.505664, 45.807643]",0.0,False,[] +openai/gpt-oss-120b,crack-7z-hash,5,"['80f610d8-bf0d-400c-9585-8efee8808abc', '54efa7af-b259-4c81-8b78-cbd714ec1683', '16c5def7-83a1-42b7-9ffb-d7065da572e0', '6447806c-dc8d-45e7-b25a-96d83e545f11', 
'f4ece6ec-71bb-4cab-9146-50ee0d232963']","['crack-7z-hash__chZSUeZ', 'crack-7z-hash__s8CHygu', 'crack-7z-hash__YJVU5Ya', 'crack-7z-hash__LPukPnw', 'crack-7z-hash__gJC8hfd']",0,"[152.699364, 459.091632, 335.898885, 220.401171, 900.039488]","[27.475345, 9.843868, 139.522959, 25.862903, 46.593719]",0.0,False,[] +openai/gpt-oss-120b,db-wal-recovery,5,"['b889594d-fbf7-421d-a79d-5e87e8e7a6ee', 'b92f316d-8c02-4050-81d2-fabf60ac837a', '2fdd92d7-8a94-49c1-afe2-96efcf838124', '642bf13e-2e14-4932-a934-1fa2f8a4f5e9', '93d15a5e-3404-4214-b019-f6dc8234986b']","['db-wal-recovery__xv49Bk6', 'db-wal-recovery__bJz5fuL', 'db-wal-recovery__f8XhHKr', 'db-wal-recovery__4Ds9zY4', 'db-wal-recovery__UcyfT8t']",0,"[348.080385, 938.49404, 900.433352, 213.828565, 1004.927055]","[12.813678, 30.742533, 7.948316, 15.258408, 37.968015]",0.0,False,[] +openai/gpt-oss-120b,distribution-search,5,"['18a8c0ed-a138-457a-bc5f-e904f3654bc4', 'e3db734e-eeb3-40e9-a923-66b4270fa87b', 'b7690543-5521-48f5-8444-6a71335383cd', 'b3ca475f-a346-4ba2-86d3-4560fffc7555', 'b901d937-656c-415e-a1cd-3580abbc9d8c']","['distribution-search__KTLRYDy', 'distribution-search__UB4CPmK', 'distribution-search__YLp67ut', 'distribution-search__2A9cM54', 'distribution-search__gcAHfG2']",0,"[102.519354, 94.120256, 89.602971, 83.750681, 105.243984]","[26.038607, 165.684776, 206.522618, 33.213815, 27.66766]",0.0,False,[] +openai/gpt-oss-120b,dna-assembly,5,"['c80b612e-c453-4a90-a539-431647251b3c', 'ddf1e92e-9eba-4f78-ae68-f1884650d3e2', '22ff6409-3676-44da-8361-fd93f8004708', '559da0f5-1237-48be-b18a-fe0e36660886', '0000900d-99a6-492a-b6cc-dc3a02a8e29b']","['dna-assembly__tFvzjSy', 'dna-assembly__U5XrWVH', 'dna-assembly__YpWyRnT', 'dna-assembly__LoDokrm', 'dna-assembly__cytQbEp']",0,"[737.300847, 187.498913, 85.843506, 171.88872, 73.196696]","[52.068904, 105.866888, 23.741501, 35.73528, 142.161352]",0.0,False,[] +openai/gpt-oss-120b,dna-insert,5,"['0f30e67a-d2c4-46eb-8611-c5db4f5d4245', '4f14594b-ded0-409e-b094-79b86b4fe4cc', 
'92af63b5-7b45-41cb-b64d-f5d2ce424461', 'bd046d7a-136a-4ff1-9dec-2959cd91a50a', '8864f8dd-7ec5-4830-8214-c46ad3c36599']","['dna-insert__sNT7hUG', 'dna-insert__7sYiqP2', 'dna-insert__q5d64pX', 'dna-insert__KU6B4Yx', 'dna-insert__H2Lm9eH']",0,"[363.300554, 393.16437, 373.07906, 631.457432, 362.636901]","[80.062844, 15.074783, 29.0549, 237.637554, 23.418467]",0.0,False,[] +openai/gpt-oss-120b,extract-elf,5,"['2aadb4a7-acb4-4c8e-8744-ba5f6f68196c', '1a6d60d2-b17d-422d-bb7b-094840bc7eea', '0295b364-9818-43be-9fb6-e0a0d3bc0aa5', '6120b5c2-4af1-439f-8b55-45de899d7236', '0395eb15-b3bd-4af3-b376-9966e50c71f2']","['extract-elf__xjdaCPK', 'extract-elf__PdQNVum', 'extract-elf__m2LpNis', 'extract-elf__kM5Ztab', 'extract-elf__Nzds3rQ']",2,"[231.194484, 213.657684, 232.823262, 286.513563, 102.883306]","[22.545124, 134.972658, 108.327104, 65.335964, 12.63683]",0.4,False,"['1a6d60d2-b17d-422d-bb7b-094840bc7eea', '6120b5c2-4af1-439f-8b55-45de899d7236']" +openai/gpt-oss-120b,feal-differential-cryptanalysis,5,"['7ac18365-fbee-46f4-9c71-a026fe955df2', '168c4f60-c6b6-4160-afab-1d4ea1590c75', '147ee5a8-f2fb-4987-a5ac-38e2e6ee8929', '49309084-4303-4efd-9374-e2cf38fddc89', 'dc81e877-45c9-4c2c-bf96-4178a8218847']","['feal-differential-cryptanalysis__Hxw5QyU', 'feal-differential-cryptanalysis__mNybosc', 'feal-differential-cryptanalysis__RHBXQmJ', 'feal-differential-cryptanalysis__8iDCroD', 'feal-differential-cryptanalysis__qhnWMny']",0,"[247.940154, 289.170768, 139.054137, 273.113123, 310.606706]","[259.033895, 163.034282, 45.605724, 76.55396, 104.699105]",0.0,False,[] +openai/gpt-oss-120b,feal-linear-cryptanalysis,5,"['d0d3874e-d84c-4023-98a6-442a6a108422', 'bf984497-d26d-4954-b0a9-af0b58c66839', '8cb3e20e-abfe-4be8-ba31-c2613efe1532', 'f1f9f9b3-6288-4fa2-bc31-945f240193f3', 'e0b54c21-7a19-4106-87a2-4c9bdd9882ce']","['feal-linear-cryptanalysis__Kbmwp3f', 'feal-linear-cryptanalysis__YaLwcGP', 'feal-linear-cryptanalysis__fF3Gtpm', 'feal-linear-cryptanalysis__H53XLCE', 
'feal-linear-cryptanalysis__gSzFqx6']",2,"[522.078941, 667.512408, 192.086214, 1800.858603, 210.976295]","[212.21086, 27.372511, 46.786849, 24.43319, 60.796172]",0.4,False,"['bf984497-d26d-4954-b0a9-af0b58c66839', 'e0b54c21-7a19-4106-87a2-4c9bdd9882ce']" +openai/gpt-oss-120b,filter-js-from-html,5,"['c60e38e2-9509-4fb1-85eb-7a681c57cf4c', '08d6e1c2-f9d3-4165-bddd-d720993958ea', '99c0627c-6e49-4fdb-a230-ac59625cc09c', 'b5ad66fd-7890-4df2-ba41-bb9fdef2f075', 'e583ab23-4f8b-4ea4-9cb6-b84fce1973d8']","['filter-js-from-html__B7B7jh2', 'filter-js-from-html__essqQ3F', 'filter-js-from-html__5vT5Pc5', 'filter-js-from-html__tpcXodW', 'filter-js-from-html__5u2yP2t']",0,"[423.723401, 59.085328, 37.773888, 173.466687, 14.817925]","[60.008731, 47.241614, 35.650424, 58.027639, 26.007691]",0.0,False,[] +openai/gpt-oss-120b,financial-document-processor,5,"['7c6e1ea2-5271-46a9-8423-a481df3d362c', '57e53842-e0e2-42a3-a262-7b131a3ea3d3', 'd596ec83-9337-4876-b656-55f1e4d81d4a', '08c3fca4-5ccf-4f35-8de4-8515f8ca0e6c', 'be880ce4-3ffb-45ea-b5a6-52c3879eb707']","['financial-document-processor__nc4VLS8', 'financial-document-processor__4L2v5Gr', 'financial-document-processor__9QCodme', 'financial-document-processor__vFLSh4N', 'financial-document-processor__jrCpKR7']",0,"[149.308662, 287.284738, 85.524672, 360.900964, 786.169261]","[105.564771, 41.299511, 33.926184, 254.189701, 29.252571]",0.0,False,[] +openai/gpt-oss-120b,fix-code-vulnerability,5,"['a4aa8ddd-bc91-416c-8bec-f8c8e4c71655', '6c3e5b9f-0193-4fea-9098-c4f01174cc73', 'e034aa30-7135-4787-94ed-a2b9a686e080', '6f27a6ea-6f12-4bd8-bcac-196bf6b46c42', '28e10d7f-64e9-4b6f-9905-fa9bfed1a9fa']","['fix-code-vulnerability__q3xoWJm', 'fix-code-vulnerability__o2m84PB', 'fix-code-vulnerability__qMqn7Kn', 'fix-code-vulnerability__ghTVCa3', 'fix-code-vulnerability__uzS22pq']",0,"[900.181918, 511.118547, 904.445221, 79.437651, 982.965566]","[3.354842, 26.188564, 25.858952, 4.3598, 44.086854]",0.0,False,[] 
+openai/gpt-oss-120b,fix-git,5,"['89ff8175-d909-484a-9228-d523a6cd6335', '51087244-cf29-421a-aa48-040bb72177c5', 'e5b9f04d-951c-4611-8087-b24b3fa3d703', 'c85b9247-8a5c-44dc-be6e-1e560f079900', '395723e2-c50c-4bdb-8a94-d0353f337d4e']","['fix-git__ywpZN52', 'fix-git__xae7DAe', 'fix-git__w5uemMA', 'fix-git__RmGzHi4', 'fix-git__rhP8cWn']",3,"[261.036047, 420.166207, 124.362502, 136.63619, 905.16125]","[49.244581, 42.14706, 22.46506, 16.786263, 39.21254]",0.6,True,"['51087244-cf29-421a-aa48-040bb72177c5', 'e5b9f04d-951c-4611-8087-b24b3fa3d703', 'c85b9247-8a5c-44dc-be6e-1e560f079900']" +openai/gpt-oss-120b,fix-ocaml-gc,5,"['308438a9-434b-4e9c-9e07-291bfcdbb6a8', '8e5635ca-df06-441e-b8a6-97135f191b69', '97c95118-1ccd-482d-be34-6ef8ebe081de', '76ffc68f-298c-4a17-9af8-2ebf6764985a', '7403a09a-0fc1-451f-b066-27f71cd7562a']","['fix-ocaml-gc__r2sKaLs', 'fix-ocaml-gc__hT2Mir9', 'fix-ocaml-gc__cMioFD2', 'fix-ocaml-gc__5Ff8BBi', 'fix-ocaml-gc__3Xm7ZcX']",0,"[3622.551929, 3607.898232, 3646.360484, 3617.420311, 3852.052565]","[39.69319, 33.124698, 27.260859, 106.263851, 41.059568]",0.0,False,[] +openai/gpt-oss-120b,form-filling,5,"['c5821718-9037-426b-a94f-43df426362a8', '152e4a54-47e2-4cfc-af48-5eef0432d035', 'ee0b3f4d-5bb5-4cad-b349-1ed614e6cbf0', '10643166-85aa-4dfa-b28a-585ec4ba4ce7', 'e3e8a5dc-d931-446a-b5f8-95798559528e']","['form-filling__JxreReQ', 'form-filling__EXJPC6q', 'form-filling__UShW8Wh', 'form-filling__avoLGta', 'form-filling__KwrQWHF']",3,"[68.063662, 455.258407, 226.702148, 60.202199, 132.03676]","[9.813272, 21.957647, 11.316964, 23.60058, 17.261704]",0.6,True,"['c5821718-9037-426b-a94f-43df426362a8', '152e4a54-47e2-4cfc-af48-5eef0432d035', 'e3e8a5dc-d931-446a-b5f8-95798559528e']" +openai/gpt-oss-120b,git-leak-recovery,5,"['7415e9c8-bec2-4af8-a5d4-07ecd3aad706', '27d7ccc7-7795-45a2-85aa-3e3d4ac91d6e', '15d03be4-680f-429b-bb5b-b736edcf1895', '165dfcae-d81e-42d6-b04b-5290130548b3', 'b9dc9fdd-9255-4966-9a0a-bff97c3b2d59']","['git-leak-recovery__p4ZBXY5', 
'git-leak-recovery__Y8QuhEb', 'git-leak-recovery__Lw7DST4', 'git-leak-recovery__Q6RLkMM', 'git-leak-recovery__5MsVZgy']",1,"[62.324182, 72.803329, 349.064746, 108.627261, 196.66383]","[78.88185, 183.365641, 45.879913, 28.07565, 72.491153]",0.2,False,['15d03be4-680f-429b-bb5b-b736edcf1895'] +openai/gpt-oss-120b,gpt2-codegolf,5,"['61c1ebd6-ecd2-4589-aba4-dc0e8e9103bd', '23f3c0c3-60ed-4ee6-b36e-d77d0c250506', 'd58cf7c7-1b18-4476-a66d-cd11b5ec9cd6', '67484e4e-39b0-4977-b1cf-317583dbb287', '219314c6-3848-4ad1-9449-c6fbe06e5f82']","['gpt2-codegolf__eQjp3GU', 'gpt2-codegolf__DvGDgx3', 'gpt2-codegolf__QnhWNjr', 'gpt2-codegolf__CRPZS9L', 'gpt2-codegolf__UPSNJSV']",0,"[213.935991, 901.131075, 490.102273, 910.407775, 608.671783]","[357.829044, 134.489061, 166.109075, 165.070082, 38.157169]",0.0,False,[] +openai/gpt-oss-120b,hf-model-inference,5,"['2c1c8620-33bb-4f7a-9e26-afca1ae296b3', '67f6ab68-2c9f-43d1-83d5-a8a33ada9ad1', '9e97df51-00bf-4537-a05b-52e81406872f', 'a0e2fc2b-6448-43c3-a8c4-20d68f9401ae', '6620592f-7629-4e2a-809f-8a17218f9828']","['hf-model-inference__FG3mFzC', 'hf-model-inference__GrgqpSr', 'hf-model-inference__a7Jr34c', 'hf-model-inference__rAtVkaC', 'hf-model-inference__yDZhfhg']",0,"[344.412713, 81.434178, 432.93709, 112.271213, 136.968838]","[76.216159, 43.648052, 29.177762, 41.893553, 30.392303]",0.0,False,[] +openai/gpt-oss-120b,install-klee-minimal,5,"['c6c0c9c3-ceff-4a90-a4d7-afcd7cca8143', '09eb0f32-fe90-4b5f-8ac8-b98abf8824fb', '9fc225d5-3115-4f43-b789-cf2a7508f53e', '64e07463-a844-42bf-a4b9-1fa96080a741', '6996ed8b-bfcb-4daa-af5a-cbeea8248184']","['install-klee-minimal__W4HNxJQ', 'install-klee-minimal__BW99iTh', 'install-klee-minimal__7oGu8LH', 'install-klee-minimal__jPPtM7B', 'install-klee-minimal__ipCHgpV']",0,"[844.496042, 440.05567, 900.162637, 900.002167, 906.714287]","[54.87522, 89.604835, 92.263396, 101.915399, 77.19314]",0.0,False,[] +openai/gpt-oss-120b,install-windows-3.11,5,"['224c96a0-dd65-4d8f-84f7-d51266b16515', 
'cbbab881-3117-4bcd-8627-2375f6e76ba7', '3515c5ce-4ba8-43d8-8b4a-7548d84bc8dd', 'c4d862d2-0938-4e03-b418-e0a34b632590', '36eda90b-64ae-4353-a05e-b9c249bcd2ee']","['install-windows-3.11__pXFtfxR', 'install-windows-3.11__YX3syqM', 'install-windows-3.11__DDNRgzF', 'install-windows-3.11__yQSd6Sp', 'install-windows-3.11__dC7bycy']",0,"[68.857492, 106.370422, 214.174458, 99.331575, 265.171101]","[118.780734, 26.562346, 19.557922, 63.746026, 31.410272]",0.0,False,[] +openai/gpt-oss-120b,large-scale-text-editing,5,"['c7f44e5c-d19b-45c7-8435-5ef25aeb84c1', 'd8f3a31b-8117-448b-b3a2-76d6af2bdcd7', '05b9a65e-21a9-486e-b774-3cb081b1da3f', 'ea2a6674-e248-495d-b33a-324116f6a87f', '609a4dbc-cc97-47a3-984d-f1ab42be02e1']","['large-scale-text-editing__6pY54rq', 'large-scale-text-editing__aapCViR', 'large-scale-text-editing__vMKHLJN', 'large-scale-text-editing__muA2n9k', 'large-scale-text-editing__2JjrAjr']",0,"[1243.511917, 1212.308338, 124.59175, 169.447121, 1228.576369]","[230.237811, 66.609163, 12.4911, 284.503629, 25.49039]",0.0,False,[] +openai/gpt-oss-120b,largest-eigenval,5,"['747cd308-e681-451a-91ff-fdf0271a8366', 'aab53a59-5ee6-49f9-8d18-9a7e202b3bc5', '0a20299f-a983-4f70-bfc6-54084b805f60', '5f36c3b8-8bb8-44bf-b68e-8f19fa96c1dc', 'aa6079f2-f1b2-48a5-8024-89d587a1d1d8']","['largest-eigenval__r3mJMEk', 'largest-eigenval__mBQwMSL', 'largest-eigenval__N4sYX3M', 'largest-eigenval__sx4fj4s', 'largest-eigenval__5aJcz8X']",0,"[900.036554, 900.002571, 912.980275, 921.148706, 900.004603]","[102.758596, 158.722084, 110.872741, 58.903867, 84.737278]",0.0,False,[] +openai/gpt-oss-120b,log-summary-date-ranges,5,"['d8a56aba-4c25-4f56-af23-d1e7180d9ff1', '4cc61104-c20a-40c9-a5c6-db5500ac786f', '3153e3ab-3d98-4261-aa9e-a1c149b964aa', '909acbce-5d68-428e-978b-09e519930c8c', 'eec49838-b1f3-4eb6-b24b-b41872c08fa7']","['log-summary-date-ranges__3mZbA8U', 'log-summary-date-ranges__3k52StT', 'log-summary-date-ranges__2PtyCfy', 'log-summary-date-ranges__8k2L5ea', 
'log-summary-date-ranges__MRzsaw7']",0,"[24.000834, 116.518906, 95.80214, 91.054566, 65.117263]","[28.148446, 71.795492, 51.161636, 15.359259, 83.625433]",0.0,False,[] +openai/gpt-oss-120b,make-doom-for-mips,5,"['933b3917-9a41-4b0d-8531-179c63a40e51', '11bc9253-3243-4013-8211-37f5bb2ea246', '66404b00-9bee-4340-b1c6-87139906e5f4', '123eeeab-4f1e-4f0a-8ee0-ef6f88a82f5f', '07a36267-0f21-4f98-88db-732144ddff0f']","['make-doom-for-mips__sfnMwyR', 'make-doom-for-mips__yoLQDeQ', 'make-doom-for-mips__g5hXGVZ', 'make-doom-for-mips__7KDUcdV', 'make-doom-for-mips__Ak2BGJc']",0,"[900.576974, 902.678084, 900.074141, 907.782117, 966.58628]","[51.875306, 104.922321, 291.920094, 31.10101, 174.166594]",0.0,False,[] +openai/gpt-oss-120b,make-mips-interpreter,5,"['6955d6e1-c4ad-47c0-81c7-dbe45c22c211', 'ae175cae-b553-44fe-9ff9-66df2149cce6', '2d475720-4f6e-4d19-b7d2-e0c6b6f45179', 'aaf28db0-7afb-445d-98c7-b0b6ea17ddb1', 'ff555fb1-798c-4c2b-b26a-150666b8168e']","['make-mips-interpreter__KuwWBZk', 'make-mips-interpreter__TMXbkNa', 'make-mips-interpreter__TzQXDyi', 'make-mips-interpreter__ny2iiiz', 'make-mips-interpreter__TPQSH2J']",0,"[1815.799916, 1800.490537, 1810.701113, 1802.664278, 1805.902352]","[265.88606, 87.231893, 44.353438, 67.718376, 71.615538]",0.0,False,[] +openai/gpt-oss-120b,merge-diff-arc-agi-task,5,"['8985e1bf-01b5-43f4-a9ab-e94ffcd5aa35', '1906f849-da3a-4728-a22c-4a79ea4c7d0f', '68bd8595-ef59-451f-938f-e0f035b8144a', 'c3d1d64d-1011-42e9-a4b2-7b14d8caa603', '8f970467-15d1-460e-83ba-852e8e198f69']","['merge-diff-arc-agi-task__C8UT7Xp', 'merge-diff-arc-agi-task__xJ6RKFZ', 'merge-diff-arc-agi-task__mzbpTah', 'merge-diff-arc-agi-task__GemddmC', 'merge-diff-arc-agi-task__xpGMhwY']",0,"[206.437032, 272.444211, 912.786288, 154.486227, 457.203985]","[20.32571, 51.347815, 69.09869, 76.196224, 29.037205]",0.0,False,[] +openai/gpt-oss-120b,model-extraction-relu-logits,5,"['0a5ea382-2579-4a5b-8712-3adaaac0f7a5', '5db0491c-697e-405f-9164-a1258d139e01', 
'1eb8980a-30fb-430c-9943-c8c0dd682126', 'bd049ae5-a453-44cf-9d94-ff498d27a67a', '95912b7e-a302-486c-aca7-fcbece978172']","['model-extraction-relu-logits__YWgT4Eu', 'model-extraction-relu-logits__sgPnjPX', 'model-extraction-relu-logits__zTMvVFu', 'model-extraction-relu-logits__qGDxU6s', 'model-extraction-relu-logits__CskfjB9']",0,"[85.651858, 298.438904, 330.267988, 76.035923, 94.462799]","[31.423663, 166.109228, 23.137657, 41.972675, 13.412804]",0.0,False,[] +openai/gpt-oss-120b,mteb-leaderboard,5,"['f85dbfdc-dc8c-4516-b2b6-b1c35c5297f6', '15f0d58b-0edb-4c13-bd1a-d9e1b744c036', 'c0c7c72e-0298-4ec4-ad93-39631f1befb0', '322c02c4-bcc0-4158-a235-37f217ecdd04', '61d922bf-544a-4720-9433-f866f23d622b']","['mteb-leaderboard__sFbmpuY', 'mteb-leaderboard__5rvgj3T', 'mteb-leaderboard__b4i6Dwo', 'mteb-leaderboard__puDzF26', 'mteb-leaderboard__97Ya4Ui']",0,"[133.259922, 62.592313, 101.789268, 15.610789, 76.385778]","[20.979536, 5.364007, 4.721688, 10.861186, 31.980362]",0.0,False,[] +openai/gpt-oss-120b,mteb-retrieve,5,"['14de5547-a198-4697-8d0d-c151112df426', '4503f9c5-63a6-4e2a-b04e-6250752b491f', '50b51e0d-10d2-42c8-9acf-97eada281776', 'f293590c-d771-456a-8b24-c5cc2b11256a', '830c98de-9701-40c2-8c5a-0b6b04617d5b']","['mteb-retrieve__wwHY3FN', 'mteb-retrieve__W5jtJpW', 'mteb-retrieve__Svfg3kY', 'mteb-retrieve__5xqwUsn', 'mteb-retrieve__jYohWt5']",0,"[90.518879, 123.541305, 46.369117, 118.904306, 107.016436]","[112.968267, 111.397996, 8.252573, 32.072229, 2.958464]",0.0,False,[] +openai/gpt-oss-120b,nginx-request-logging,5,"['3d882f34-d6a5-4838-9b32-c13118dace70', 'bee85626-fc72-4c57-9109-f3019ca3e8b0', '8253e46b-2d9d-4330-91c2-a9b4e7f32f73', 'd8586f46-ff91-4510-8d7e-290639b1cccd', '5012fde6-6065-4285-902b-080179fcbfed']","['nginx-request-logging__R97bUdn', 'nginx-request-logging__Frod3Ab', 'nginx-request-logging__2JbE2Qc', 'nginx-request-logging__ahvuoCm', 'nginx-request-logging__DEN6Qus']",2,"[128.177112, 91.825849, 134.591175, 136.52262, 150.540703]","[27.889292, 99.771284, 
17.640124, 31.261461, 164.198596]",0.4,False,"['3d882f34-d6a5-4838-9b32-c13118dace70', 'bee85626-fc72-4c57-9109-f3019ca3e8b0']" +openai/gpt-oss-120b,openssl-selfsigned-cert,5,"['101a70a4-b733-4429-87c5-d1145be51387', '6edbeb23-a268-4d4d-8b69-3470d7ee7fd8', '4e980c1c-bc29-4a88-a52c-2d2e2b3a4c0f', '0150b187-e0e9-4828-a85a-e1d6fa539f86', '87f93bdc-15b6-407a-9a72-63146b4e26ed']","['openssl-selfsigned-cert__27fZEBT', 'openssl-selfsigned-cert__TZTDPHD', 'openssl-selfsigned-cert__TVwW3BG', 'openssl-selfsigned-cert__Yn2U7GK', 'openssl-selfsigned-cert__BGx2g3k']",4,"[40.525633, 138.642155, 55.749684, 115.492058, 64.629051]","[52.282074, 17.48762, 23.722417, 41.761574, 28.265141]",0.8,True,"['6edbeb23-a268-4d4d-8b69-3470d7ee7fd8', '4e980c1c-bc29-4a88-a52c-2d2e2b3a4c0f', '0150b187-e0e9-4828-a85a-e1d6fa539f86', '87f93bdc-15b6-407a-9a72-63146b4e26ed']" +openai/gpt-oss-120b,password-recovery,5,"['6b7dbe2b-f483-47dc-8f83-cce61d6b8e92', 'b681f844-aaf0-4c6c-a787-f96ef4612a72', '19a1e6fa-f010-4109-8e53-dd1813cee283', 'dee41e04-1644-4de3-b5b1-c46cc1df7635', 'dc0a9d42-a91d-4aa0-b2f2-77ae7469bc84']","['password-recovery__3TC57LZ', 'password-recovery__RiEMUHt', 'password-recovery__UcAKvdt', 'password-recovery__hMRksnc', 'password-recovery__DGRsiCv']",1,"[367.672835, 107.874483, 907.98809, 900.797521, 409.378542]","[66.904768, 54.159016, 56.64711, 58.246171, 37.474756]",0.2,False,['b681f844-aaf0-4c6c-a787-f96ef4612a72'] +openai/gpt-oss-120b,path-tracing,5,"['2e1384ad-3a24-44aa-8735-33204c510876', 'ba279e82-1c1f-4a4f-bde4-8a32712c63d7', '9d16e901-6dc8-43ba-9b8c-a897c998ce5b', '9723b5f3-2249-4834-8d7e-4e4e6afe7cc3', 'c1bc29a2-e8d6-4d3d-95f0-6e1abd61a50b']","['path-tracing__aM2cszQ', 'path-tracing__nKnjGyy', 'path-tracing__J3hYYuM', 'path-tracing__PXZn9rT', 'path-tracing__86WTyxn']",0,"[205.974847, 327.615089, 160.948016, 990.240518, 241.042023]","[40.481991, 43.956246, 23.491011, 76.037486, 65.560554]",0.0,False,[] 
+openai/gpt-oss-120b,path-tracing-reverse,5,"['4470f1d3-f48f-4640-b5bc-a3a3d2ae4472', 'e58c4f52-1525-4447-be83-e8d6da9965f2', '6c7cf140-63dd-4bc5-b608-fbb0e4fff0fc', '64fc6129-ff1c-4c91-92d7-f69de3791968', '8d802c65-2d3d-4405-95cd-41887a0e4ac6']","['path-tracing-reverse__w2XRhYV', 'path-tracing-reverse__Qhe9aBi', 'path-tracing-reverse__JTN5bNY', 'path-tracing-reverse__az3VgaR', 'path-tracing-reverse__vqgkHpE']",0,"[1974.918343, 1816.060844, 1800.814695, 1333.044395, 1829.715037]","[14.924411, 33.010238, 59.215695, 81.73831, 63.377239]",0.0,False,[] +openai/gpt-oss-120b,polyglot-c-py,5,"['a1c69c39-b122-4744-940c-d1c081a286eb', '5a5234be-8a8f-442c-88c7-a2ad23935027', '9e6d9e23-84d1-49c3-ba09-fca3d1052210', '6e7bf554-2aac-4171-80ae-c1a60f52c095', 'b441002b-6138-4ade-bfc4-d2ff4d5e55d2']","['polyglot-c-py__nhTBZdf', 'polyglot-c-py__XumCJXM', 'polyglot-c-py__pD3U4Cj', 'polyglot-c-py__vCtXf98', 'polyglot-c-py__wDDwc6c']",0,"[117.740586, 276.857032, 900.698217, 178.844767, 89.113331]","[40.262632, 42.218543, 99.23711, 17.054292, 48.456092]",0.0,False,[] +openai/gpt-oss-120b,polyglot-rust-c,5,"['36866639-1694-4a12-8ef2-06869295a9e1', '9dbbaf1b-8b17-4c1c-9011-833f4e8a6193', '2eabf22c-5d87-47e9-a8bd-1cf0941e750b', 'b64ff970-4482-46ec-8071-b241fa3ac2dc', 'e4a7bb49-11fd-484b-a315-3def68640f46']","['polyglot-rust-c__gypEf2X', 'polyglot-rust-c__nVeW5Mh', 'polyglot-rust-c__CHXpCy7', 'polyglot-rust-c__d96oX73', 'polyglot-rust-c__tEM8vnC']",0,"[928.696927, 900.017479, 92.649689, 141.29147, 906.844519]","[26.092312, 64.516826, 121.1357, 97.339862, 290.624553]",0.0,False,[] +openai/gpt-oss-120b,port-compressor,1,['49ac1797-42a7-4927-83a7-4929eb4ebf97'],['port-compressor__C5mBN7r'],0,[3604.644179],[55.309683],0.0,False,[] +openai/gpt-oss-120b,prove-plus-comm,5,"['7f2ea6f9-620a-4ce9-b4dd-85defc41c11f', 'ef6d7c00-6f76-4581-912b-022185de56d7', '718c03e7-ba95-482f-a555-a8596b738b5c', '3c64f610-4a83-4697-8959-81374b14295c', 
'6a5d43a0-0fae-4a90-bb79-b4085d7023bb']","['prove-plus-comm__oQGWLmC', 'prove-plus-comm__wQaabho', 'prove-plus-comm__dyfgyr4', 'prove-plus-comm__o5S6gVw', 'prove-plus-comm__KhCDYDE']",5,"[141.927923, 289.439585, 41.834069, 192.563146, 36.75817]","[25.112397, 60.190224, 21.202708, 86.922415, 27.512835]",1.0,True,"['7f2ea6f9-620a-4ce9-b4dd-85defc41c11f', 'ef6d7c00-6f76-4581-912b-022185de56d7', '718c03e7-ba95-482f-a555-a8596b738b5c', '3c64f610-4a83-4697-8959-81374b14295c', '6a5d43a0-0fae-4a90-bb79-b4085d7023bb']" +openai/gpt-oss-120b,pypi-server,5,"['eb866939-d739-4f8e-a0cf-fd37f4f8918e', '0b4069cb-260e-478a-a508-01fbd6e5c766', 'a6f6e521-c229-467b-a291-fa4c6b624b75', '1ec8d952-441b-4aec-870a-800b991c14d9', '721d90f8-70b2-4531-9917-3920bb72ed12']","['pypi-server__sgZbv6b', 'pypi-server__6uWQwR8', 'pypi-server__iwoxZem', 'pypi-server__Xdueh2r', 'pypi-server__Ef4tB3V']",2,"[102.815255, 90.523169, 252.89447, 104.80126, 271.763319]","[81.176361, 62.552878, 62.460974, 35.259821, 14.369918]",0.4,False,"['eb866939-d739-4f8e-a0cf-fd37f4f8918e', '1ec8d952-441b-4aec-870a-800b991c14d9']" +openai/gpt-oss-120b,pytorch-model-cli,5,"['2659e60e-61c7-4b01-802f-d2b94ee8623a', '0b4a8c07-7eaf-4b86-9b48-4f89a88128a3', '6bd4f311-3a61-44eb-b4a8-f5aed32fac9f', '2ee9af8f-e91d-4a56-9ff8-64ca92b18ba7', '94ff821e-2677-4513-9a96-9738dd8271a9']","['pytorch-model-cli__5VtTjYi', 'pytorch-model-cli__zfAMdSk', 'pytorch-model-cli__dyXVT9f', 'pytorch-model-cli__w6RdbmM', 'pytorch-model-cli__QomSZRa']",0,"[126.826242, 29.613396, 35.28571, 225.341036, 117.514224]","[134.716261, 94.610271, 36.761746, 133.252919, 15.223506]",0.0,False,[] +openai/gpt-oss-120b,pytorch-model-recovery,5,"['c6abca5f-3cae-432f-a5ea-cd321f7540f6', '5007e0fb-fb40-47fb-a2e1-ac6ec308cbec', '684addef-1aa7-42b2-923c-1ddcd85cd084', 'be5c8570-3b01-42c3-8d7b-54cc7e571171', 'bfa8feba-2a79-4350-81f7-54801cfe3ab2']","['pytorch-model-recovery__KznWMFr', 'pytorch-model-recovery__Q8DqmBK', 'pytorch-model-recovery__w2Re4de', 
'pytorch-model-recovery__yi6smN2', 'pytorch-model-recovery__dF7Xe2k']",2,"[306.707442, 82.945311, 348.259716, 900.968414, 903.385289]","[44.674445, 35.025304, 14.123545, 70.656638, 53.665857]",0.4,False,"['c6abca5f-3cae-432f-a5ea-cd321f7540f6', '684addef-1aa7-42b2-923c-1ddcd85cd084']" +openai/gpt-oss-120b,qemu-alpine-ssh,5,"['63c9e862-a49c-4e58-b91c-411f2b72b19f', 'b630e084-7e40-42a2-808c-86c20bc1a230', '0eea25f4-baf3-47ed-b4f4-048649ae57e7', '549550bd-347f-4b15-94c5-a923e2fba9ca', 'bf26c899-a265-41ce-b782-1bfc20651720']","['qemu-alpine-ssh__r5aJVUB', 'qemu-alpine-ssh__LaTgZvt', 'qemu-alpine-ssh__auZWT4H', 'qemu-alpine-ssh__zxL56yx', 'qemu-alpine-ssh__5quBKEi']",0,"[323.99536, 110.566921, 189.207552, 907.166709, 951.269345]","[9.761077, 4.665456, 4.212294, 25.419392, 10.081636]",0.0,False,[] +openai/gpt-oss-120b,qemu-startup,5,"['3659ca32-7816-423d-94ea-787521afc68b', 'c77ddb80-11d1-4cb8-bd57-29e8714e12cb', '28130f67-13a6-4840-a741-7d55d0380cbc', '6e206e4c-f793-41da-974d-28d2cb49d0db', 'f0169179-6e40-4386-81c2-1224307f8109']","['qemu-startup__b4cerNj', 'qemu-startup__bn9fTn6', 'qemu-startup__x9NZADh', 'qemu-startup__7MsJmLE', 'qemu-startup__qgxyWzv']",0,"[46.33987, 140.478451, 104.046084, 166.744352, 710.100094]","[30.638728, 18.368987, 11.908836, 6.284733, 33.195938]",0.0,False,[] +openai/gpt-oss-120b,regex-log,5,"['e68f4725-38ae-42b7-81e1-4f6c737e77d0', '4035013f-411a-4e6d-819c-523e0766d3ae', '84a92b61-e7e8-4c90-a517-ce3b29045974', '5ff3fb4c-94b4-49d0-b41b-a3afb32a4be5', 'd0958c42-7f97-4c32-b18a-5723277b808d']","['regex-log__C2YJ6ok', 'regex-log__wETMbF2', 'regex-log__hfALtWV', 'regex-log__bg9TyZc', 'regex-log__qVJqMpM']",2,"[82.229762, 48.991195, 73.696373, 74.322783, 106.013093]","[97.158379, 190.348078, 76.581372, 133.210862, 65.082783]",0.4,False,"['4035013f-411a-4e6d-819c-523e0766d3ae', '84a92b61-e7e8-4c90-a517-ce3b29045974']" +openai/gpt-oss-120b,reshard-c4-data,5,"['101724e9-43a8-4fd2-ac39-fa24325ebfe8', '928f7549-3088-44e1-8527-b7e0dc56f3a9', 
'e3dbbb46-2c7c-437b-8581-43761667d6d1', '3d291e52-6166-417f-bd3e-9cd296d5dcba', '4c6df88d-e11b-4190-9d5e-9a05ff440c20']","['reshard-c4-data__VCSRMXD', 'reshard-c4-data__9DCBAQt', 'reshard-c4-data__gueZPpX', 'reshard-c4-data__TDEYNUH', 'reshard-c4-data__cF6Dnau']",0,"[904.945609, 199.423086, 529.4665, 324.155524, 163.610161]","[150.60071, 44.647021, 91.192046, 20.315782, 62.750314]",0.0,False,[] +openai/gpt-oss-120b,reverse-engineering,5,"['6fe11f90-0267-4a81-84ff-10eb804a4884', 'be1fcab7-d515-41e5-a3cf-f5fd422fd565', 'c1f9e8d1-c0c4-4ed5-ab5a-98dea645467c', '754df405-0db1-4e46-807b-959f2fa530a7', 'ba379ce3-ad2f-47ae-94b7-890311dd4d7f']","['reverse-engineering__tGmuHo7', 'reverse-engineering__2HYD7uA', 'reverse-engineering__pDRDtGF', 'reverse-engineering__huhq6wi', 'reverse-engineering__M9qtLBY']",1,"[1804.178101, 923.221569, 1800.043933, 1801.939504, 1802.649992]","[29.652014, 64.987013, 25.546832, 16.631648, 38.965834]",0.2,False,['be1fcab7-d515-41e5-a3cf-f5fd422fd565'] +openai/gpt-oss-120b,run-pdp11-code,5,"['021f04d4-4b5a-4be4-9059-ed79174016fc', 'faad540d-dbfb-45a3-9ffb-9caa3a099580', '5288c6f2-556a-4003-95e7-60791d392cde', '432ad616-576f-48b7-b8fc-82fef748ffa1', '26094bb4-1976-4d2d-b45c-b91dcc088929']","['run-pdp11-code__BY3sNr6', 'run-pdp11-code__DuuynKP', 'run-pdp11-code__r3iTUvJ', 'run-pdp11-code__FQEf8vp', 'run-pdp11-code__UQAgweR']",0,"[202.563766, 291.149648, 234.588641, 1095.415645, 275.998361]","[20.081074, 18.661669, 58.784153, 274.153045, 104.573179]",0.0,False,[] +openai/gpt-oss-120b,sanitize-git-repo,5,"['e51def54-c337-488b-ab93-403a9ac03bbd', 'f5d40646-39de-420c-86f3-af650d44e9fd', '569e2afa-1b3b-4705-9d79-403e7a9d9b7a', '9d1bc831-2e1a-4400-8e2e-e86ff75330c0', 'c4d1cce3-76f9-4e3e-b409-156261d2c435']","['sanitize-git-repo__JBSwSau', 'sanitize-git-repo__TTF3Wgo', 'sanitize-git-repo__PzWTtAU', 'sanitize-git-repo__8Bxa3mc', 'sanitize-git-repo__RdKPq9G']",0,"[148.139276, 145.117085, 93.422444, 529.431522, 226.641051]","[52.901878, 28.718699, 306.440165, 
182.614518, 65.470006]",0.0,False,[] +openai/gpt-oss-120b,schemelike-metacircular-eval,5,"['81455380-ab27-40c8-95c0-5119d8b0a9b6', '43bda7f4-0edd-4200-aa9c-267cf18fe3c1', '1ddf7e9c-7a29-4b40-8935-39f3c02f10cc', '534db045-118e-4154-aab6-503de0e6d2c2', 'fda7af6e-37d3-4539-8f51-08e0aa759d01']","['schemelike-metacircular-eval__Zh5CqEm', 'schemelike-metacircular-eval__fqmWQAU', 'schemelike-metacircular-eval__WyZiSHW', 'schemelike-metacircular-eval__NFijk5Q', 'schemelike-metacircular-eval__bnTZF2f']",0,"[284.288081, 225.855565, 2400.033948, 277.201498, 96.662482]","[56.473595, 39.420174, 24.10915, 39.613702, 25.024817]",0.0,False,[] +openai/gpt-oss-120b,sparql-university,5,"['949a7f4c-8af3-4cdd-86ff-0aa5c51bab27', '4f7938f8-d277-433b-9663-96df7fc2f290', '2e52b47e-3ccc-441b-9ca5-2a6b3d4c3b13', '95dcd984-798b-4428-aefa-c0367feaaefa', '8e6d32d4-c45c-4db4-a123-4685dbe95f97']","['sparql-university__NSnRaaq', 'sparql-university__R2pkipV', 'sparql-university__6z6GE57', 'sparql-university__ePJp5zU', 'sparql-university__An8iCQG']",0,"[55.441049, 91.231956, 135.395173, 138.075652, 92.636642]","[31.769832, 134.80829, 41.483706, 87.604478, 80.715817]",0.0,False,[] +openai/gpt-oss-120b,sqlite-db-truncate,5,"['e6c8abcb-daf4-4127-871f-2215a4557d21', '5e096801-1e42-4c90-9da0-8e37ad48c35a', '9f49ab87-9a5d-4f70-a52f-cd6c6584c039', '8b14f17c-3f53-44ba-a659-04f02e2db82b', '924eeac1-571a-4f91-b076-8f7448c6cc8e']","['sqlite-db-truncate__VJzti93', 'sqlite-db-truncate__tMwqEar', 'sqlite-db-truncate__M4cmhAF', 'sqlite-db-truncate__enzsNjG', 'sqlite-db-truncate__ymfYSo5']",0,"[160.282328, 321.21476, 347.02981, 798.021671, 902.514742]","[29.94234, 47.90702, 103.156202, 29.041676, 68.416642]",0.0,False,[] +openai/gpt-oss-120b,sqlite-with-gcov,5,"['31b9b3bf-c77d-4ac8-a92f-e11fdd001ce3', 'dcb980fc-3489-45d7-a06e-8364d34ab8f0', 'cd9a98f2-458b-485b-b83b-91fab1989bc3', '72ff3a25-d182-4c34-a2dd-ae5a9b8d765c', 'b3e296e4-824d-4dbc-af37-0729ce40ce4b']","['sqlite-with-gcov__y6cojfe', 
'sqlite-with-gcov__LGocTpS', 'sqlite-with-gcov__WMooaYN', 'sqlite-with-gcov__2NMvHFx', 'sqlite-with-gcov__EgdiZ49']",4,"[408.31915, 160.96343, 241.021303, 373.045597, 247.866984]","[60.960212, 18.640138, 62.094527, 129.680533, 30.560483]",0.8,True,"['31b9b3bf-c77d-4ac8-a92f-e11fdd001ce3', 'cd9a98f2-458b-485b-b83b-91fab1989bc3', '72ff3a25-d182-4c34-a2dd-ae5a9b8d765c', 'b3e296e4-824d-4dbc-af37-0729ce40ce4b']" +openai/gpt-oss-120b,torch-tensor-parallelism,5,"['d8c266c5-877c-471c-a8ae-9ac1335dc80a', '0a6c2940-b35f-40b9-813d-e2adc824a2de', '3dbd774d-c9d1-4c47-a26a-aebf98a287b5', '46fd2c8a-b6a2-4cfd-b783-7599c0d4faf0', '0774f36f-e195-49c5-af0e-6d912cddd63a']","['torch-tensor-parallelism__hvvfdLk', 'torch-tensor-parallelism__85KJxxc', 'torch-tensor-parallelism__gcyvHV3', 'torch-tensor-parallelism__me7qscR', 'torch-tensor-parallelism__xUzvaZp']",0,"[78.420052, 53.688934, 574.500412, 590.599073, 49.128307]","[47.706958, 54.387003, 47.794043, 111.253885, 26.792423]",0.0,False,[] +openai/gpt-oss-120b,train-fasttext,5,"['e427563b-6a0b-496a-81c2-19b1e8d77054', '6e747ca1-f4aa-4db0-8116-0eefe733abaf', 'd27e35f2-1de1-49b6-8dd3-048c9333b51e', '02ebafac-a700-42de-a694-c404cc486503', '526f3558-0eee-4a97-b076-85f32773170b']","['train-fasttext__Qnpcn8x', 'train-fasttext__opiU5hE', 'train-fasttext__Fj9FgPk', 'train-fasttext__ivfkHxy', 'train-fasttext__LJCKsDS']",0,"[1430.868638, 1404.93066, 3606.177206, 3601.413439, 3625.486346]","[31.099879, 62.958705, 19.914682, 39.143102, 15.657987]",0.0,False,[] +openai/gpt-oss-120b,tune-mjcf,5,"['891564a4-b4ae-41c9-8a79-7d93d786baef', 'ec929e5c-ba62-482e-b0aa-3f85ba5bb945', 'bbbc214a-913a-4840-a2ad-ca3a8746561b', '09364e83-3dd8-4e19-97db-8ddc3dd21e60', '22285a78-4e32-4db2-aed1-a9c42d4e339d']","['tune-mjcf__DP86NXv', 'tune-mjcf__bdkkdSC', 'tune-mjcf__oBWeE2r', 'tune-mjcf__qX25R7F', 'tune-mjcf__FXX6xQq']",1,"[904.484652, 926.456411, 907.71481, 707.803744, 954.618012]","[25.005458, 17.518841, 15.972874, 8.370998, 
24.537049]",0.2,False,['09364e83-3dd8-4e19-97db-8ddc3dd21e60'] +openai/gpt-oss-120b,video-processing,5,"['366b9c98-329c-48a9-91dd-1cebf50935fc', '004b95f2-95d2-4346-98f1-65de9221a60b', '19f8b9fe-a1fd-40ea-84e1-16d498115663', 'b867e9ba-5abd-45e1-bd76-79d5ed8e5285', '9243aa47-ecd9-47ac-8dbf-56a39c956566']","['video-processing__UuvAt77', 'video-processing__TdKsgPD', 'video-processing__4nKJX49', 'video-processing__sBmqSMs', 'video-processing__Vs49vs4']",0,"[75.652025, 62.642712, 49.491286, 481.845186, 112.399611]","[134.562022, 21.167477, 12.931619, 67.16024, 52.473265]",0.0,False,[] +openai/gpt-oss-120b,vulnerable-secret,5,"['15456c0d-f3da-420d-b59d-055c91915343', '9c4ba46a-0d68-438f-9054-586208a13874', '44aa0c21-5e5f-4a62-a476-40c8430acb51', '06ae0449-cb21-42bb-b9d0-7044203d03c5', '2a893b34-3159-499d-ad5c-5cd04f69800f']","['vulnerable-secret__NZNaezj', 'vulnerable-secret__5jhV8D9', 'vulnerable-secret__NkZuGfu', 'vulnerable-secret__8fshYxf', 'vulnerable-secret__hUmAcAC']",0,"[905.258086, 901.435665, 303.773106, 382.465756, 909.075465]","[15.799635, 64.541968, 11.327245, 24.929803, 31.843394]",0.0,False,[] +openai/gpt-oss-120b,wasm-pipeline,5,"['53b91d78-bd4c-402c-a2d6-498aafbf5b5d', 'f9df35ff-19b3-4af2-abf4-2e04081fcee2', '5033897a-554e-4b19-95b1-d604d04c8dc7', '7c3c2db3-61e1-429e-9c59-316b6f963a11', '5fcb4894-caaa-4ee4-9135-30c95cdfa6a4']","['wasm-pipeline__6KL9rDZ', 'wasm-pipeline__GPr8YGr', 'wasm-pipeline__i95BZBW', 'wasm-pipeline__WTEhytR', 'wasm-pipeline__2oL8Uss']",0,"[34.906796, 903.444879, 225.762332, 345.992577, 925.35537]","[22.028468, 21.086678, 9.80045, 19.784564, 12.198092]",0.0,False,[] +openai/gpt-oss-120b,winning-avg-corewars,4,"['667236fa-ea82-4c71-9fd0-ed933c887f36', '1b938b55-f019-4f28-a957-ca52037f1a7e', 'd082fe58-69a8-4b5d-b0b9-b31b64431875', 'a27ea156-8698-428e-8524-4231144328f1']","['winning-avg-corewars__c4nCYyz', 'winning-avg-corewars__t73TNHp', 'winning-avg-corewars__hfTudNi', 'winning-avg-corewars__ehsaNZR']",2,"[1380.136805, 1742.693082, 
847.490415, 117.953503]","[23.666631, 4.853928, 4.622614, 83.872405]",0.5,False,"['1b938b55-f019-4f28-a957-ca52037f1a7e', 'd082fe58-69a8-4b5d-b0b9-b31b64431875']" +openai/gpt-oss-120b,write-compressor,5,"['ab3bf2da-d401-4778-893e-6187b4f73086', '41c5dc24-dfae-4084-9527-668b34920f0a', '4330392c-1bb9-4051-b220-b1a81b8742b1', '8a89b0a1-41f0-451f-a839-06e15dc9bee6', '1400e1a7-4021-4e2b-985f-1733042c1165']","['write-compressor__JwXkPQD', 'write-compressor__cCcZWnz', 'write-compressor__gDKBqBR', 'write-compressor__QDBJ2xK', 'write-compressor__AVgeHjr']",0,"[200.664599, 901.886255, 1224.669908, 900.034653, 826.793061]","[26.327616, 106.403589, 231.241986, 68.130563, 38.808455]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,adaptive-rejection-sampler,5,"['d0598434-de08-40ad-b769-c5f1234561a9', '2be26b05-3333-478c-afe2-b2acdc76c0b1', '0f2bae12-7846-4c95-be69-4cfb7d4428b2', '7700b12c-dfe8-4f41-93b9-64581dd40a6f', 'a999cabe-63c6-498f-901b-1c6bf92f713d']","['adaptive-rejection-sampler__M57v2GV', 'adaptive-rejection-sampler__picjvi6', 'adaptive-rejection-sampler__g2gvoSK', 'adaptive-rejection-sampler__KMoGZiY', 'adaptive-rejection-sampler__5RRekWV']",0,"[903.992176, 903.037236, 900.006828, 900.549711, 912.631231]","[56.489563, 35.131243, 18.101052, 324.740352, 32.021445]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,bn-fit-modify,5,"['c9d9ef1d-5312-4365-8b44-93d143d8df84', '3d272d79-ba69-4495-b298-831b4c4ce340', '2880e3b8-6709-4818-b186-a00f298614f9', '717bde28-03f3-4aeb-b8b6-13fbc007aec1', '3f795318-9191-4fdb-83b4-88ead1e0d1c4']","['bn-fit-modify__K7yUELL', 'bn-fit-modify__S4aGW4A', 'bn-fit-modify__WxAEmDc', 'bn-fit-modify__wWbVjSi', 'bn-fit-modify__LTwTuUG']",0,"[661.523861, 657.684522, 902.013699, 978.36311, 2540.058613]","[21.314179, 65.144863, 116.580282, 180.183497, 14.923045]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,break-filter-js-from-html,5,"['82206198-4a21-4b5c-a190-7b53c7efdd9b', '010be9ab-f73d-4825-a6c3-20de731068c2', 'f3fd64ee-c6da-4daf-b4e9-10bda5a18f58', 
'9b4d2167-867f-4846-b762-6476f4d17ac8', 'ee895e13-0c39-4d00-b6b8-9173df0f3fde']","['break-filter-js-from-html__xG5aE8g', 'break-filter-js-from-html__9XQ2eWs', 'break-filter-js-from-html__odysNvF', 'break-filter-js-from-html__enSDWFg', 'break-filter-js-from-html__wd69qF8']",0,"[424.310438, 166.897669, 340.818113, 1210.775896, 768.959523]","[123.140385, 29.973002, 16.233107, 27.53015, 41.260181]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,build-cython-ext,5,"['f59ad4df-ecb8-4e78-a851-ac3693341911', '0a93f725-4c04-4520-b674-abfb4666cf96', '81b55edd-b648-4967-aefd-4559416e5ca0', '63d234a3-5e5c-4d44-b55c-891a3269df5d', '36fc82e0-4a1a-4e1d-b1cb-0a06218551e4']","['build-cython-ext__Pu4aARG', 'build-cython-ext__yypF72p', 'build-cython-ext__9zEZ2EK', 'build-cython-ext__eggKSRg', 'build-cython-ext__CTxZWjy']",0,"[900.027686, 923.791429, 902.36444, 900.006475, 595.879952]","[180.513952, 19.830433, 124.897922, 134.25737, 65.102456]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,build-initramfs-qemu,5,"['81dd5a03-18a1-47be-b176-b2ecb592c3a5', '180ef646-0896-48be-96db-f96a58ff4dcb', '6b44baac-48e9-4290-819a-c9a58bb81d1a', 'ad0752fc-e8fb-4647-aefd-387f1b0ffd4f', '87832daf-8d14-4806-a704-3530a25daa3b']","['build-initramfs-qemu__9Jhs8yA', 'build-initramfs-qemu__cgEpuNQ', 'build-initramfs-qemu__WHhJrSq', 'build-initramfs-qemu__vWTzQXc', 'build-initramfs-qemu__8FnMKqy']",0,"[85.91385, 909.26996, 447.428323, 284.491387, 144.180436]","[12.035722, 59.096345, 156.032642, 103.348298, 25.205842]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,build-pmars,5,"['7fe73d27-fcbe-4ea0-8a3b-14b5e50aa7ae', '6bb19af1-6995-41e3-bb84-0f7cf04ebf22', '1faee519-791d-436a-931e-d27ea1245c0f', '5bcf5723-8b8f-46f3-b65b-1ab7c0008e20', 'ee5c1bc9-dde1-4c01-9f47-65674d197acc']","['build-pmars__UFJVHV5', 'build-pmars__HoMGtVD', 'build-pmars__3sa3CEd', 'build-pmars__TxuKjno', 'build-pmars__abedQTU']",3,"[792.382754, 671.288101, 904.272271, 196.1096, 439.080494]","[16.855271, 7.54895, 20.59521, 2.877599, 
4.788029]",0.6,True,"['7fe73d27-fcbe-4ea0-8a3b-14b5e50aa7ae', '5bcf5723-8b8f-46f3-b65b-1ab7c0008e20', 'ee5c1bc9-dde1-4c01-9f47-65674d197acc']" +zai-org/GLM-4.5-Air-FP8,build-pov-ray,5,"['64b0f6c2-ddff-40b2-b7f8-f13f58175153', 'b5caf698-964c-484d-a268-a635553496c1', '38a2f1fc-0a22-4cac-bf70-5a68310607aa', 'fc560f56-a0e3-4f94-8d24-1b0420f273e6', '90e44b13-db81-454d-a0b6-75396a5916e7']","['build-pov-ray__d7G3r5m', 'build-pov-ray__bRgVUo9', 'build-pov-ray__mj4GZ7S', 'build-pov-ray__uB7ggtu', 'build-pov-ray__tUHwU69']",0,"[2846.885745, 857.452523, 1701.299445, 822.825175, 804.24679]","[34.128657, 22.686526, 51.865878, 110.598551, 57.426374]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,cancel-async-tasks,5,"['ce366a9d-36b9-4ad0-af44-038e7394fdf5', '61c6b66d-acfa-447f-9815-abb99f588e43', 'e62d30a4-2f82-4ad7-8b4a-380a802a1e6e', 'f9df8f65-4ad8-4f2a-9646-f3267652e4a9', '3fae39ad-14b7-495a-8c76-02cade4e259d']","['cancel-async-tasks__TTGYmr5', 'cancel-async-tasks__SmxCpFD', 'cancel-async-tasks__m9UWTNt', 'cancel-async-tasks__EnhdDPt', 'cancel-async-tasks__ikHN3yg']",1,"[27.84011, 170.509257, 185.145985, 204.080652, 94.816883]","[72.092223, 40.491055, 170.406393, 68.021387, 60.579117]",0.2,False,['ce366a9d-36b9-4ad0-af44-038e7394fdf5'] +zai-org/GLM-4.5-Air-FP8,chess-best-move,5,"['a548e08d-8e9f-4998-8722-3e2b6f47afdc', '30c39365-b589-4068-a684-50617e917c37', '6bc7e090-9c8e-45ad-a37e-b4087fa84c5a', '210864df-ec02-4e28-bfec-cc844c5994fc', '88066c6f-9bb7-4901-aa6f-40c62f75d8db']","['chess-best-move__pYaSkBp', 'chess-best-move__nQMWN6t', 'chess-best-move__9EdP7XX', 'chess-best-move__DcPgzt8', 'chess-best-move__jjVhWet']",0,"[509.512858, 632.160736, 815.436121, 728.487402, 824.135439]","[12.992091, 335.365449, 117.6577, 6.003035, 57.650835]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,circuit-fibsqrt,5,"['0d5a2add-a3a9-4d77-9cdd-1ba8a2903d3d', '257d5b40-f86a-4c2b-be54-78e1215ab6b9', '4cd74840-f383-42ca-b550-aaec276bceff', 'e7cc511b-f33d-4a36-89ce-76d36801ca40', 
'0c33b640-b2e5-487e-8fd1-70e77c7fb4b1']","['circuit-fibsqrt__XKMJrWY', 'circuit-fibsqrt__F8LqeyW', 'circuit-fibsqrt__v4EFfRa', 'circuit-fibsqrt__hjzBNRD', 'circuit-fibsqrt__szJZnjc']",0,"[1501.638539, 2126.641662, 1594.485598, 3605.875561, 3604.425977]","[14.31499, 52.062557, 42.205601, 34.154215, 1273.808619]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,cobol-modernization,5,"['25696c0b-e73c-489b-9e3e-39f809321d9d', '7e8812f1-a339-4fde-9000-e9f444056788', 'fa83b1c4-cf59-4efe-ae1f-3f3d9f935f3a', '20a6a7f0-0098-4f8b-98f3-0e0fffb04342', 'eb846e6b-ae92-477d-97d0-31a0aa87ef36']","['cobol-modernization__V5Zzdna', 'cobol-modernization__MRfZ4sQ', 'cobol-modernization__SpsMC5s', 'cobol-modernization__FAVA8hK', 'cobol-modernization__nVVFdMz']",2,"[918.676874, 396.241093, 446.492221, 902.880442, 922.902224]","[83.152149, 52.492487, 52.403768, 21.38447, 47.871375]",0.4,False,"['25696c0b-e73c-489b-9e3e-39f809321d9d', '20a6a7f0-0098-4f8b-98f3-0e0fffb04342']" +zai-org/GLM-4.5-Air-FP8,code-from-image,5,"['15c0dbd1-92fa-4797-b9de-276d837c204a', '05e82edc-e480-4112-8c51-1004cf27052f', 'a1858cc5-7c88-4858-ba02-1e84f2695806', '01e1fd5d-74d3-4bb1-bab1-960864d0b1f9', '9eec53de-11ab-45ed-b74f-af37fde9e9fd']","['code-from-image__fnBdEGL', 'code-from-image__qFQLfpQ', 'code-from-image__uy658HD', 'code-from-image__kMimj9Z', 'code-from-image__eVF4yh7']",1,"[584.150479, 1150.170613, 1224.048082, 844.295601, 276.399463]","[25.021884, 59.013846, 70.924967, 27.926323, 42.31006]",0.2,False,['9eec53de-11ab-45ed-b74f-af37fde9e9fd'] +zai-org/GLM-4.5-Air-FP8,configure-git-webserver,5,"['40616c3c-a933-455c-891e-71a20c379e9c', 'a0d29ae7-835f-4fb4-8de4-076a8d10dba3', 'feec636a-19bd-45ec-be2b-47680f32dd44', 'd3fcc935-7551-4958-a2c7-a5126341affb', '34523b03-4d0a-4378-a7a5-4bfbfdc0b2cc']","['configure-git-webserver__rHqKDcd', 'configure-git-webserver__cnhsfQz', 'configure-git-webserver__seo8wxN', 'configure-git-webserver__J642pef', 'configure-git-webserver__TppA3fr']",0,"[788.794964, 300.760405, 321.276225, 
926.116323, 260.746594]","[41.366926, 59.469004, 19.382531, 157.433204, 16.161384]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,constraints-scheduling,5,"['ca358afb-ab6e-452c-8dd2-534056b29c16', '148480b3-7dce-400e-8a8c-7f65956c58f3', '2c9e6ad1-f533-426b-a6fd-932ca3c937f1', '52995888-e2ab-4bff-9bdb-6a54fe5404c8', '451e5156-cf86-4745-b6eb-fbaae22e6a02']","['constraints-scheduling__86j2j88', 'constraints-scheduling__YuQQWi8', 'constraints-scheduling__U3RrNE8', 'constraints-scheduling__KVkzFSC', 'constraints-scheduling__aJmHmPh']",4,"[458.157091, 516.868172, 400.99791, 360.917783, 577.996644]","[36.508253, 141.699001, 61.693998, 25.314239, 48.856694]",0.8,True,"['ca358afb-ab6e-452c-8dd2-534056b29c16', '148480b3-7dce-400e-8a8c-7f65956c58f3', '52995888-e2ab-4bff-9bdb-6a54fe5404c8', '451e5156-cf86-4745-b6eb-fbaae22e6a02']" +zai-org/GLM-4.5-Air-FP8,count-dataset-tokens,5,"['d8cc0b61-15c9-42ec-bebf-f4ef420826f2', '33a4bf0a-f6e5-4379-bde2-b971cbdf6317', '5d8b5329-94db-490f-9f86-9e4965f82d75', '41f19d9b-0fc9-4c01-be8d-a4d61e45585b', 'ebc95ba1-88f2-4d35-acac-43692742a910']","['count-dataset-tokens__ph9xHfQ', 'count-dataset-tokens__rEjMgPJ', 'count-dataset-tokens__uxrpVaj', 'count-dataset-tokens__rF68orD', 'count-dataset-tokens__9veRvR9']",0,"[905.280255, 920.351024, 246.060796, 588.420629, 605.313678]","[15.897979, 134.026788, 18.156761, 84.052646, 21.135558]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,crack-7z-hash,5,"['be58f30a-9afd-40db-b1e7-97ed9f50def6', 'c6d53bb7-5b70-4dfe-a7fe-cfb32ed99f50', 'dab6079e-9216-41a5-8bcb-a520c600c34f', '815c3e02-432b-4731-bfcb-6c12f69a8b21', '22d89426-a089-451a-af11-74b7b3807e91']","['crack-7z-hash__PbymwQx', 'crack-7z-hash__eUxedaT', 'crack-7z-hash__ZYhEhMY', 'crack-7z-hash__xhieu5w', 'crack-7z-hash__fBKy9bR']",0,"[900.033434, 900.266514, 904.448797, 900.763471, 900.99169]","[29.855881, 10.69311, 15.788835, 26.665131, 24.533238]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,db-wal-recovery,5,"['e2113bfb-9d33-4d24-a0c8-26f95f4e9b77', 
'f87c9eb5-d29a-4370-ab86-5ce30b1686b6', '1be98eea-b9ea-4d38-a068-9d93efe202f7', '5a865dfe-904d-40eb-8cf8-5673296c732a', '084c53c7-2bba-42f8-b2c2-d848c47b27b5']","['db-wal-recovery__xLAPPJC', 'db-wal-recovery__MhrxQoG', 'db-wal-recovery__wqHtKng', 'db-wal-recovery__ET94UTg', 'db-wal-recovery__c9FdSeJ']",0,"[910.990073, 120.651215, 321.451714, 910.573184, 740.996391]","[57.248871, 8.640963, 50.601008, 57.191341, 27.30205]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,distribution-search,5,"['a6758dfd-81fb-4284-9ffa-61ba5dbe32e4', 'f7f96947-2a27-4a59-9a6d-577adb52ad40', '3448513f-6dac-40e2-9bfe-6b8d08f98d2c', 'a8df12f3-9ecf-49c4-88ca-91d63b4851db', 'dfc9658d-b782-4ac2-9dbf-f521957733bb']","['distribution-search__VcqDhRu', 'distribution-search__FMJPy5v', 'distribution-search__uKgAtxL', 'distribution-search__JeYffuy', 'distribution-search__JektXia']",0,"[877.421695, 738.994043, 508.107931, 263.069871, 1558.271111]","[208.712291, 55.260479, 119.969694, 12.205077, 63.981261]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,dna-assembly,5,"['96664f21-195e-4a7f-903d-46ec1162f93a', '443f9ee5-c3ad-4fa0-8725-22529aa36592', 'bd7d739f-98b2-4161-b93d-da3aaf622bec', 'dd3f0803-762c-4bb7-a858-de4dec4dd99e', 'a57502a1-ff23-4bcb-bc69-6f7fc14f6158']","['dna-assembly__ZjqX9TP', 'dna-assembly__BUvrHzt', 'dna-assembly__AB7VMuQ', 'dna-assembly__Vdpun46', 'dna-assembly__9LCbbG5']",0,"[722.096251, 644.52054, 531.922187, 721.467656, 738.761843]","[28.170278, 41.579921, 33.177886, 58.406237, 35.412562]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,dna-insert,5,"['7230fdbc-86d7-469d-9b95-079236efd67b', '640c6edb-f40e-4380-86d9-438f9e24839d', '540275ce-c236-41ad-bd36-1aff908fa555', '27fdaa4e-3636-4e9c-b53a-51d99fb32f46', '6da7bac5-6b1f-4459-915d-ce0e98535ed0']","['dna-insert__4PsTQTF', 'dna-insert__NAoyW5H', 'dna-insert__9dEvd7M', 'dna-insert__xpAvswu', 'dna-insert__vrPgfVM']",0,"[419.1406, 617.783595, 379.011423, 361.682963, 360.083575]","[26.902594, 331.059928, 13.810891, 50.377705, 332.70983]",0.0,False,[] 
+zai-org/GLM-4.5-Air-FP8,extract-elf,5,"['21b2037d-6b8c-4d01-9401-17e28f2ed86d', 'b58fbf32-6dc4-47e9-aed2-5ced4fd17880', '7cad8e0b-1d4e-4f93-91ee-8e159207e8eb', '64883f75-7897-4421-b301-987f0bd30455', '6052188c-823a-48ef-a026-17a9b0918138']","['extract-elf__QFTiaej', 'extract-elf__Lqomrcd', 'extract-elf__h7uVA44', 'extract-elf__KhdjG2e', 'extract-elf__nxZkqhX']",2,"[232.990402, 382.428815, 219.024964, 202.807915, 375.939295]","[106.994185, 64.298298, 58.34759, 38.048787, 98.249937]",0.4,False,"['7cad8e0b-1d4e-4f93-91ee-8e159207e8eb', '64883f75-7897-4421-b301-987f0bd30455']" +zai-org/GLM-4.5-Air-FP8,feal-differential-cryptanalysis,5,"['59f7fa95-f3be-4423-84b3-734348f6ff66', '1cacca91-de7c-49fd-9523-7f3daa0bec69', 'deb156e6-22a8-48cc-a753-bef7546cf845', '93a64d85-0ac2-4f68-bd4c-ffe172219c49', '43009783-ed25-4a4f-a6f8-e484af7ec17b']","['feal-differential-cryptanalysis__civXULT', 'feal-differential-cryptanalysis__mx2Ciwd', 'feal-differential-cryptanalysis__tVPrjin', 'feal-differential-cryptanalysis__dxA9V3d', 'feal-differential-cryptanalysis__snEgK8d']",0,"[171.561258, 55.728406, 799.657608, 140.430419, 253.085367]","[268.712158, 37.43228, 17.67697, 179.97289, 246.997765]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,feal-linear-cryptanalysis,5,"['c788a979-4c22-4679-9638-433a205d9b27', 'f0f64979-e489-49dc-85a1-fe1cbc592a79', 'fc2416d9-465b-445d-aa6d-960f885722e8', 'b785de13-5968-4e49-8825-ed9a5deb3571', '88c78970-7a52-476f-91d3-f1ad5ee2831d']","['feal-linear-cryptanalysis__oP6Tsvy', 'feal-linear-cryptanalysis__QeEr2Kq', 'feal-linear-cryptanalysis__roNaGgA', 'feal-linear-cryptanalysis__HXLgqBf', 'feal-linear-cryptanalysis__FN7Yp95']",0,"[1822.693658, 1806.338421, 1260.432391, 440.10435, 1075.059699]","[39.99521, 75.744122, 42.319807, 98.308208, 21.320025]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,filter-js-from-html,5,"['11446b26-35c5-4cc9-a4ae-eec840dd62ce', 'b555076b-e922-4a59-aa94-4380848ac011', '2533a021-8594-429f-a203-99bcf8485608', '0e3d4a47-9082-4c27-b3f3-9129eaae9cdf', 
'c0486381-bd53-4051-b66c-973c25422379']","['filter-js-from-html__kZTYqbb', 'filter-js-from-html__7unhF6A', 'filter-js-from-html__kVndorL', 'filter-js-from-html__FWLX6Mn', 'filter-js-from-html__tKiWzg8']",0,"[128.306812, 949.654966, 805.143316, 35.26487, 900.773719]","[46.935825, 29.706106, 29.813243, 33.647616, 49.624109]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,financial-document-processor,5,"['3dd1acc3-56b0-42c5-902a-0c0d3a7955f5', '74a87cbc-94ad-4fa5-b828-3b7a5b755a5e', '8a533501-ab8e-4a53-a5f1-e7fe1b65f2f6', 'de4ab92a-a3cb-4ce9-9b6d-6320e1337e40', '6673573e-76a4-4470-bc75-21c73872264e']","['financial-document-processor__k39NdXG', 'financial-document-processor__rBLnijo', 'financial-document-processor__aBHqfog', 'financial-document-processor__9ECDgnV', 'financial-document-processor__c2w3bPB']",0,"[120.205635, 1200.000845, 1202.196976, 413.321093, 193.760596]","[131.066778, 57.441674, 78.635276, 21.501885, 233.397057]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,fix-code-vulnerability,5,"['2a44b8e0-c44d-4d28-91f6-f48ded348133', 'b8a2939b-6f15-4946-be28-9acca4d43b30', '5f1d3157-e56b-481d-b703-97aca3d9908c', '15e6a4da-5f5f-44c7-ab4f-31495d6aeee2', '57d2b30a-0d1a-4531-babe-444bf4b2f64d']","['fix-code-vulnerability__MGy52GT', 'fix-code-vulnerability__ZwbvxLb', 'fix-code-vulnerability__XAc4JBL', 'fix-code-vulnerability__johjkxr', 'fix-code-vulnerability__4zc54wg']",0,"[503.604219, 423.313306, 907.45893, 1034.219472, 250.674926]","[8.085752, 34.347224, 10.599085, 10.656009, 14.58586]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,fix-git,5,"['680286e7-125b-4569-b57c-1b81ffa58f22', 'bec4d01e-0376-40c4-bb79-f792629980f0', '9b7621f6-5cda-4e2b-bfdb-27719499abc8', '1f72b7a6-faaa-4d08-9cff-68c142c80902', '171624f6-7681-47a6-830f-0ebd546b2047']","['fix-git__4D3bTTT', 'fix-git__iPmBwCu', 'fix-git__2V2WdsM', 'fix-git__8CApRNH', 'fix-git__g7a9r9X']",3,"[56.829034, 101.819031, 241.068161, 902.426968, 920.482572]","[14.126865, 16.948387, 52.561449, 48.604066, 
54.926383]",0.6,True,"['680286e7-125b-4569-b57c-1b81ffa58f22', 'bec4d01e-0376-40c4-bb79-f792629980f0', '9b7621f6-5cda-4e2b-bfdb-27719499abc8']" +zai-org/GLM-4.5-Air-FP8,fix-ocaml-gc,5,"['0f5d7c35-30bd-4b76-8698-e7a9906affe5', '8ac03aaf-6f58-4c7f-a77e-f77bc85c9faa', 'c5869034-8b6b-4712-8cdb-41fe3f395368', 'd952d7a4-2aa4-4256-b940-ff8bc21d7a87', 'd21f18be-2a96-4b09-9d50-f83c158dc120']","['fix-ocaml-gc__F8xzmqK', 'fix-ocaml-gc__jK8WwEN', 'fix-ocaml-gc__wRVy3kv', 'fix-ocaml-gc__jtt7BAp', 'fix-ocaml-gc__m7wowoJ']",0,"[3614.86428, 2787.353902, 1609.463975, 3341.003226, 3702.752326]","[121.30197, 212.305898, 32.64398, 95.059603, 47.500465]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,form-filling,5,"['e9ffdf80-dcfa-4a1d-8d5e-6768219b907a', 'c7b8b4c0-89e6-4fc2-a813-a15b8d72869d', 'be7142de-e7bd-4abe-adfd-bccb4cb63131', '6e6f8980-02c0-4217-8bce-89647196b466', '996c40a4-da12-41f1-8249-672ed8804478']","['form-filling__bvhyNwH', 'form-filling__YTkKcj5', 'form-filling__2WpMZ5W', 'form-filling__yAvFJyq', 'form-filling__xCJQHTr']",4,"[309.418837, 224.783559, 934.238207, 371.876728, 520.001461]","[24.95743, 4.888644, 3.252813, 48.824233, 5.2094]",0.8,True,"['e9ffdf80-dcfa-4a1d-8d5e-6768219b907a', 'c7b8b4c0-89e6-4fc2-a813-a15b8d72869d', '6e6f8980-02c0-4217-8bce-89647196b466', '996c40a4-da12-41f1-8249-672ed8804478']" +zai-org/GLM-4.5-Air-FP8,git-leak-recovery,5,"['1aac18c2-72b0-4cff-b235-be3d00e77c73', 'ee7c1a0e-5cf3-48da-a381-fdff2d3f3d77', '0701bd50-d081-4d54-941e-570a9d051743', '42597e46-a6a2-4106-991e-24215edae1b2', 'dade16f4-a78d-4021-9b5a-bd4783cddf91']","['git-leak-recovery__fRsFNnD', 'git-leak-recovery__pGegdxy', 'git-leak-recovery__7GbuQno', 'git-leak-recovery__pYM6BXF', 'git-leak-recovery__6T9ooBR']",4,"[110.732175, 369.341489, 109.87425, 171.647829, 343.562996]","[35.481204, 27.110198, 200.14403, 14.887537, 26.080325]",0.8,True,"['1aac18c2-72b0-4cff-b235-be3d00e77c73', 'ee7c1a0e-5cf3-48da-a381-fdff2d3f3d77', '0701bd50-d081-4d54-941e-570a9d051743', 
'42597e46-a6a2-4106-991e-24215edae1b2']" +zai-org/GLM-4.5-Air-FP8,gpt2-codegolf,5,"['65c308bb-ba53-4cce-8a9d-400f723ecaf7', '10209b2d-f3cd-4972-a053-f2fbcf36b593', '6d6b8567-42ba-4d1f-bdfa-d24dce3f87b7', '8ad7e586-9d2b-4290-af2e-3f0e41a6474d', '2eed3e80-a10d-427b-8494-014fc040b093']","['gpt2-codegolf__7hyp4fQ', 'gpt2-codegolf__vShjSwC', 'gpt2-codegolf__UqxZAMg', 'gpt2-codegolf__2XzXCWx', 'gpt2-codegolf__ibS4qtM']",0,"[857.213558, 168.904017, 901.027477, 900.001642, 302.317268]","[24.005177, 19.432017, 232.270762, 264.071246, 86.051675]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,hf-model-inference,5,"['5c7984d6-e2ef-41b4-910a-1e26c15e161a', '565044c7-181f-42a0-a98f-2447832364f3', '70fdd6cf-e4da-4bbb-968c-92675bbbcd99', 'f2064a7b-49fb-4cb6-b408-c9d3ee119f8f', 'f9a3195f-91b9-479e-a27b-f2f1c8a8fdc5']","['hf-model-inference__Z8aroMu', 'hf-model-inference__zNj6epC', 'hf-model-inference__QmKT52n', 'hf-model-inference__zKiaxep', 'hf-model-inference__AHtXdCJ']",4,"[214.834857, 401.206725, 363.338164, 92.532709, 1993.84101]","[41.313571, 27.728605, 24.245601, 37.746494, 175.717729]",0.8,True,"['5c7984d6-e2ef-41b4-910a-1e26c15e161a', '565044c7-181f-42a0-a98f-2447832364f3', '70fdd6cf-e4da-4bbb-968c-92675bbbcd99', 'f2064a7b-49fb-4cb6-b408-c9d3ee119f8f']" +zai-org/GLM-4.5-Air-FP8,install-klee-minimal,5,"['06b36570-1863-4146-99f7-f761290703de', '760e7d17-6e86-4ecb-8b61-2997998a78d3', '6c28df03-b3fe-41cc-9a5d-86278cb896f2', '87b6d493-025d-45c1-aabd-618b271a3160', '4d6deb71-731d-4035-9dd3-f06cc813c1dc']","['install-klee-minimal__7F5CwUv', 'install-klee-minimal__f68MMHC', 'install-klee-minimal__Gjw5eH2', 'install-klee-minimal__hXEUcLU', 'install-klee-minimal__sFjKAeA']",0,"[903.034776, 908.220079, 913.315869, 826.878221, 908.189576]","[40.729916, 131.779264, 103.763285, 36.264364, 199.090493]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,install-windows-3.11,5,"['85e219a4-6110-44df-a2e3-26e6a853efe8', '1e4f776b-7524-44f2-b9e0-a5be702eeb72', 'd9ce4c6b-953a-4ad8-85bb-fd3bf6881c7c', 
'f3aaaa56-3b9c-4dbd-bfb8-68e1a418e5d4', '330709c5-8f13-415d-9c64-3b9dfac60680']","['install-windows-3.11__ABZgTtG', 'install-windows-3.11__LsEbtR8', 'install-windows-3.11__Ps4uFMX', 'install-windows-3.11__xeSuuQm', 'install-windows-3.11__6Lh5qFp']",0,"[757.110773, 352.388501, 131.930154, 256.979049, 221.956582]","[39.916464, 25.565403, 15.129767, 33.095771, 20.098376]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,large-scale-text-editing,5,"['3ec0518d-d1e2-4246-9c27-c003aa02591b', '86ea8d23-553c-4389-8d31-94f5fcac083e', '1dfcc15f-dbef-4f83-b13f-e6b695ff212a', '73b8911b-f3d3-454f-a837-e3453ea2078d', 'ddc7930d-eace-4d8c-9b88-f5245baceeaf']","['large-scale-text-editing__UKmq8Vi', 'large-scale-text-editing__dDdCNAF', 'large-scale-text-editing__L5aCwgJ', 'large-scale-text-editing__K7X6t3b', 'large-scale-text-editing__5wBQkFF']",0,"[1229.003979, 1211.805926, 1212.510062, 1200.820858, 220.464173]","[11.030312, 71.080175, 207.15367, 41.029486, 137.158357]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,largest-eigenval,5,"['a648dfae-38b0-446d-88c0-ff179e335af1', 'e34312a2-c0e0-4b20-aa22-52fe9ca8bc63', '568e5d2b-7dcd-48c1-b46c-9236bf862ad0', '25234113-072e-4896-ae82-43e0cb6fb206', 'eed1b113-389a-4d74-9ac4-983b7a2b0ab3']","['largest-eigenval__2AgY7WV', 'largest-eigenval__qhbVn8M', 'largest-eigenval__7qGeYBu', 'largest-eigenval__75PxZMx', 'largest-eigenval__8KnRXGV']",0,"[900.375306, 900.005405, 900.849507, 900.562171, 339.727485]","[131.750173, 65.005076, 346.989493, 33.312607, 52.656222]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,log-summary-date-ranges,5,"['26c91249-e0b4-4f73-83fa-ad08aad206d0', '4f0c8ed6-bccf-4714-a72d-0783b6d98c07', '6747793e-147a-4d60-9c25-5b13ee9946ab', '3573c70c-9740-4872-961b-6f84a624b0a2', '9a13732f-f64a-4144-98b2-86de1cf7d49d']","['log-summary-date-ranges__FSmEahq', 'log-summary-date-ranges__ef6yfnD', 'log-summary-date-ranges__UFnuoDG', 'log-summary-date-ranges__sqokgV9', 'log-summary-date-ranges__HWNjdsd']",4,"[81.057681, 248.297571, 76.797332, 131.317284, 
99.454935]","[42.973802, 35.806237, 17.770023, 28.814233, 30.812428]",0.8,True,"['26c91249-e0b4-4f73-83fa-ad08aad206d0', '6747793e-147a-4d60-9c25-5b13ee9946ab', '3573c70c-9740-4872-961b-6f84a624b0a2', '9a13732f-f64a-4144-98b2-86de1cf7d49d']" +zai-org/GLM-4.5-Air-FP8,make-doom-for-mips,5,"['d5dba17f-42af-47c5-ba4b-2c84e3114d67', 'dfe643eb-2a79-4085-8378-ccdeb30c6a4a', '9a90c6c3-aa44-41d3-80a0-dfd2f4b3d7d4', '1b54179d-a9d4-4225-8a79-495a68f3a314', '85b372ee-f223-43a8-98a1-0a4dc1cb0344']","['make-doom-for-mips__opMJUqY', 'make-doom-for-mips__BMHGyi9', 'make-doom-for-mips__gs8gjZw', 'make-doom-for-mips__7pVqdUk', 'make-doom-for-mips__CqQLiwq']",0,"[916.121096, 905.865221, 904.808309, 920.134017, 904.991394]","[22.526745, 229.401994, 34.838793, 123.147524, 17.895625]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,make-mips-interpreter,5,"['f49a9401-7489-4781-87bc-d4ef02469b86', '13de0ee6-dd4d-4fb9-b751-6d1e7955403e', '20385de8-e4a0-454d-a96b-0ebc7c58f009', '5983b664-fe7c-49f3-9448-b5fa5545a56d', '946d672b-2327-4949-a23c-f8ea8e92b420']","['make-mips-interpreter__RDdJtiS', 'make-mips-interpreter__EtCuNBg', 'make-mips-interpreter__UGZfkdw', 'make-mips-interpreter__S8hXdQq', 'make-mips-interpreter__LkRjdKy']",0,"[673.881244, 1323.677248, 2101.725902, 1802.970575, 1683.325587]","[47.097406, 194.419852, 16.112872, 83.449289, 33.63011]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,merge-diff-arc-agi-task,5,"['970711a8-9e14-463e-b651-7362ca3795f9', '4f9d41cd-5294-4170-9300-ebdae84af03a', '1e54ae00-bb5c-4ff1-b6d5-9909abe6e526', '3751bb05-2ea2-4b84-bf8a-3594ece74bab', '868da0d2-e226-4448-acb9-168cabbf341d']","['merge-diff-arc-agi-task__XXymzSW', 'merge-diff-arc-agi-task__NNoCRtZ', 'merge-diff-arc-agi-task__gX2wVSY', 'merge-diff-arc-agi-task__dmNPopz', 'merge-diff-arc-agi-task__rgSTsMV']",0,"[809.795325, 221.573557, 468.390265, 246.856887, 231.623286]","[34.123208, 28.265583, 18.684644, 64.738423, 43.540469]",0.0,False,[] 
+zai-org/GLM-4.5-Air-FP8,model-extraction-relu-logits,5,"['94863fd0-50ce-4be6-894a-eb0d0256c2e0', '9b67c678-9b71-4b5b-aa21-c6deef3ade25', '594d949b-996a-455e-a8e9-ed0b73e43599', '54892a94-1dbb-489e-9334-0b5731df9907', '415cdd03-528d-4b67-a938-a898df6e9557']","['model-extraction-relu-logits__6TtRNmG', 'model-extraction-relu-logits__fpdRRPi', 'model-extraction-relu-logits__zjVtBuR', 'model-extraction-relu-logits__veGTqjw', 'model-extraction-relu-logits__PisZ2Uy']",1,"[140.90876, 191.329676, 1420.756777, 505.36828, 775.494639]","[8.695344, 17.815283, 15.125184, 204.411261, 223.124643]",0.2,False,['415cdd03-528d-4b67-a938-a898df6e9557'] +zai-org/GLM-4.5-Air-FP8,mteb-leaderboard,5,"['44091860-050c-4600-b44f-33e55237725a', '0b8e5b1b-837a-4ec5-b4f2-585390455db3', '38d9a557-1971-44a5-8cad-88d2169cbc85', 'c2979f38-57fd-4840-8a52-8f2f1fd0dcd8', '9b40c39e-991f-4f66-b788-45ec57a002a8']","['mteb-leaderboard__wznCSaA', 'mteb-leaderboard__GFgaMmK', 'mteb-leaderboard__5wQuY2v', 'mteb-leaderboard__UnLxukF', 'mteb-leaderboard__TjWLSjq']",0,"[495.409632, 495.884827, 2124.028368, 398.055009, 1394.095312]","[4.1917, 6.593782, 4.430772, 48.586838, 63.992785]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,mteb-retrieve,5,"['3bed7855-83c6-4c4d-9a9d-1014281a242b', '25c1c06e-4b62-44cb-a243-aec64a207fe7', 'c4f52e70-fda2-4b9a-ac50-f213cb82c082', '6d885e3b-9105-4172-8976-aeeae03ed579', 'f302d744-5403-4158-86c2-bf63c21e8585']","['mteb-retrieve__5iSDq6C', 'mteb-retrieve__GzNFVjb', 'mteb-retrieve__ez2Y3T5', 'mteb-retrieve__6E88ipx', 'mteb-retrieve__4fuXoHf']",0,"[486.003296, 154.485415, 102.981173, 420.028343, 586.633852]","[42.347753, 4.590859, 68.692181, 110.908188, 10.002214]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,nginx-request-logging,5,"['d7fe02c2-1891-46db-97cd-a17e9c05026f', '97130dad-35ce-4177-bf17-58dbc95f4658', '3bd06a7a-8261-4383-a026-279a27170652', '9b9e8459-3941-4868-94e5-1ae0a26950a1', '4c5acd84-198a-48f1-95cd-255cfb2b8101']","['nginx-request-logging__Yj4um9P', 
'nginx-request-logging__i5i8PT9', 'nginx-request-logging__r82Duht', 'nginx-request-logging__iCfyB86', 'nginx-request-logging__brtJK2J']",5,"[582.483279, 75.09853, 580.678413, 347.928665, 530.223748]","[56.940963, 13.163444, 58.25988, 38.198793, 89.756465]",1.0,True,"['d7fe02c2-1891-46db-97cd-a17e9c05026f', '97130dad-35ce-4177-bf17-58dbc95f4658', '3bd06a7a-8261-4383-a026-279a27170652', '9b9e8459-3941-4868-94e5-1ae0a26950a1', '4c5acd84-198a-48f1-95cd-255cfb2b8101']" +zai-org/GLM-4.5-Air-FP8,openssl-selfsigned-cert,5,"['b2f5c470-3a1e-4068-9126-9f7b9fc91d2d', '7b3ba137-5dfd-4b78-ac8a-e1147a2b7ccf', '98af9e50-52ee-4dbf-8410-e153ac044635', '3f004be1-e93e-460d-97e2-c5a20559ee7d', '26613299-6966-41ae-854d-71cc91bc7a2d']","['openssl-selfsigned-cert__vr7Mgbf', 'openssl-selfsigned-cert__4gqVUNJ', 'openssl-selfsigned-cert__WKmJ9VR', 'openssl-selfsigned-cert__afJi9FQ', 'openssl-selfsigned-cert__tpVZtFF']",0,"[49.326186, 58.879297, 57.877799, 91.605442, 204.033374]","[35.563306, 54.407272, 27.54588, 64.993975, 28.197871]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,password-recovery,5,"['a15ad217-6647-4260-8cb8-0f49bf2ad5f3', '6c696321-e0b5-4a3d-8b7f-76898e5d6557', '474e9c2c-4df7-4ce5-b8bf-3d529dd73476', '1bb8f992-8194-41e7-9883-fb16c90a7b22', '747a96ff-d388-4ec6-9db4-0411c63ec1eb']","['password-recovery__Mz9wiH6', 'password-recovery__8vztZEf', 'password-recovery__bNCMTzh', 'password-recovery__hFMG5fZ', 'password-recovery__vYDt3N2']",0,"[761.301874, 901.521805, 902.199165, 702.088208, 906.033574]","[28.002243, 26.315803, 34.711169, 49.917085, 27.384423]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,path-tracing,5,"['ccc90aa0-cf7a-4035-81cd-0f8466951ee7', '1f705936-1ea7-4b1d-9c72-a1d7e9412b14', '434b8a92-ba4a-4dd3-9454-a86c668d7c43', 'c91d7024-e738-4612-a9fb-42a566d2e481', '1c68ee78-4dd8-44b0-b2b9-530f1b920b02']","['path-tracing__s3eAWHq', 'path-tracing__i6PLyWf', 'path-tracing__6JaisYQ', 'path-tracing__XZnCFHC', 'path-tracing__ajPrayK']",0,"[191.306486, 575.254942, 95.967614, 1045.947678, 
1804.329302]","[94.71642, 47.041039, 29.890431, 18.447113, 71.209928]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,path-tracing-reverse,5,"['62ca9656-d6a6-4bfd-a12a-b09a325c9447', '8beaeca1-7396-4022-b39f-d2d0b04fd2a9', '74dc8e27-bf5f-4947-bb54-3b618dcadb16', '1ef92e4c-b367-4a6f-b7d7-67d2de7d6587', '8eb0c138-8356-4030-8327-32af4706cdd6']","['path-tracing-reverse__6Fpa68f', 'path-tracing-reverse__XfyZGCq', 'path-tracing-reverse__sTLgsFD', 'path-tracing-reverse__myJ5mhB', 'path-tracing-reverse__489SEW6']",0,"[1104.712887, 462.020406, 1585.560612, 254.990001, 1811.171133]","[61.554167, 49.668913, 51.067905, 11.395838, 62.5793]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,polyglot-c-py,5,"['151a4206-4449-4589-b83d-af018ea3764a', '7c243181-72d3-4a7f-b77e-786e6f078457', 'a39acfd1-92df-4f23-be2b-f8d34b95e99d', '91735112-00ac-4875-8de9-b2f1e7aba7a3', '88a3bb0f-0ea8-46db-9837-30606364e166']","['polyglot-c-py__7E7HKEc', 'polyglot-c-py__rspQUhX', 'polyglot-c-py__SRmoGhm', 'polyglot-c-py__g3GAud3', 'polyglot-c-py__3LYScUJ']",0,"[900.075737, 919.331625, 58.540728, 911.513251, 1025.306904]","[68.94914, 26.208619, 18.195473, 55.268278, 21.355707]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,polyglot-rust-c,5,"['c16c931c-8084-469c-80e6-14104a705635', '681bc96d-2a38-4a72-bd84-f95c3729ebfb', 'db0686cb-5e8b-4af6-b897-5b4d540288e5', '12fd4ea7-602b-454c-a88f-0d59b7a7c358', '00bc7790-2d01-4841-bab5-43d50d17197c']","['polyglot-rust-c__mKPXus6', 'polyglot-rust-c__Pt8yLSC', 'polyglot-rust-c__28yBLw9', 'polyglot-rust-c__2NQAnxo', 'polyglot-rust-c__WVfbkum']",0,"[900.023997, 906.801652, 910.165354, 900.103093, 94.30796]","[47.03264, 94.513468, 103.161475, 49.435056, 28.231835]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,port-compressor,6,"['e720d6d4-daa6-4ccd-8deb-1db209933c69', '6aabb34e-4f54-4658-a7d1-a4a438907b84', '85fe6953-69d1-4aee-b6d9-00cb15afc512', '598a9242-7093-4737-a04a-cd53d5bec3d6', 'd1a0fa61-58d0-47e6-81d5-11f7d52a8c34', '20b0e75c-448b-4c77-ba8b-a22400256879']","['port-compressor__FkpAG2A', 
'port-compressor__6fHBM78', 'port-compressor__Ks2qnbM', 'port-compressor__TFpXaDm', 'port-compressor__YgLEWN3', 'port-compressor__tR6nWLh']",0,"[3619.290197, 3607.651755, 969.220147, 3619.726052, 917.273604, 3615.199374]","[58.091571, 49.291129, 10.088442, 47.895726, 23.877296, 136.602485]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,prove-plus-comm,5,"['9c234dc1-abf2-4cbc-9014-3c82cbb2c0b2', 'cf934e81-c8ea-43fb-bc7d-79b384b90e57', 'a79ab506-a529-489d-b2b1-6d39587c5ef9', '2712bc11-7a50-4d3a-b1d8-32791b653c89', '3630bc08-1f8a-4ba3-a7c0-53734ac59724']","['prove-plus-comm__8SsceKf', 'prove-plus-comm__CBqJzzi', 'prove-plus-comm__GD57wfC', 'prove-plus-comm__M4uaQK6', 'prove-plus-comm__emxyVmB']",4,"[517.126616, 912.975059, 166.383672, 712.82138, 867.81343]","[91.324117, 26.718244, 60.298775, 61.849524, 91.797051]",0.8,True,"['9c234dc1-abf2-4cbc-9014-3c82cbb2c0b2', 'a79ab506-a529-489d-b2b1-6d39587c5ef9', '2712bc11-7a50-4d3a-b1d8-32791b653c89', '3630bc08-1f8a-4ba3-a7c0-53734ac59724']" +zai-org/GLM-4.5-Air-FP8,pypi-server,5,"['20aabab7-1d52-463e-9ced-3c5ba07deedc', '1bc29876-46a9-4dc2-a58a-55ce61e57bc4', '9a968ce0-e84e-4f35-a35b-6dea268270fc', '8ca02970-58fa-48fd-893c-1b13f2a64207', '8bab85bc-7dd8-4a3a-98b8-a4050319f92b']","['pypi-server__F4EYtKF', 'pypi-server__KaNLkG2', 'pypi-server__5i4CUf8', 'pypi-server__6TsSEry', 'pypi-server__PY3fCvx']",1,"[436.588969, 361.469137, 900.026183, 789.345523, 504.888556]","[23.593487, 33.934523, 41.720869, 49.204884, 30.840273]",0.2,False,['8bab85bc-7dd8-4a3a-98b8-a4050319f92b'] +zai-org/GLM-4.5-Air-FP8,pytorch-model-cli,5,"['c1074f82-7eed-4300-91dc-6076e76b1e38', 'e3dd65b1-cb80-4963-8c82-707803ca8ff8', '299add31-1e46-41ad-92d8-8ca2a9e27ea2', '087e039f-7892-4f40-b99d-d15963c6294d', 'e7d7c391-ec9f-4838-9608-ba582af2f270']","['pytorch-model-cli__FgFWnKj', 'pytorch-model-cli__KtpiWNW', 'pytorch-model-cli__EdB9PPP', 'pytorch-model-cli__jiNRFtM', 'pytorch-model-cli__BzkT276']",0,"[732.154506, 1997.071165, 435.326062, 901.222718, 
732.785804]","[25.781472, 14.119678, 39.681109, 96.480546, 127.880262]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,pytorch-model-recovery,5,"['dc9de74b-2e17-482f-b32c-8a86c54a3501', '14513e5c-1d1b-490c-95f8-6629a680a73d', 'cb1205e5-f7f4-43c4-b0fd-cd5768282a88', 'fec88f33-335d-4ec8-b8a4-230bb16670f1', '74521611-61df-4af6-aa93-efc2214ec6eb']","['pytorch-model-recovery__GkjtQd6', 'pytorch-model-recovery__dixkxoz', 'pytorch-model-recovery__i8LJFYH', 'pytorch-model-recovery__TvUAD2g', 'pytorch-model-recovery__NCCAwM7']",2,"[817.002718, 912.530928, 900.045265, 462.700587, 900.00613]","[48.64678, 26.96556, 16.521744, 69.206309, 28.680298]",0.4,False,"['dc9de74b-2e17-482f-b32c-8a86c54a3501', 'cb1205e5-f7f4-43c4-b0fd-cd5768282a88']" +zai-org/GLM-4.5-Air-FP8,qemu-alpine-ssh,5,"['6b95e0dd-69f3-47b9-90e0-fcac5abaa2c9', '27d7f820-23b9-4ef4-b0af-26f76c5a9ef0', '50275210-8562-48a2-972c-2e6ae755371c', '3112ec9d-e5e1-4832-a612-c18f38016c19', '8d358420-62e4-4edc-b062-018556def2d8']","['qemu-alpine-ssh__8qZuyxz', 'qemu-alpine-ssh__K2Ko89R', 'qemu-alpine-ssh__MQ8Nq2e', 'qemu-alpine-ssh__bfrVuVK', 'qemu-alpine-ssh__7KFYQxq']",0,"[900.017509, 234.124801, 1046.068728, 916.004436, 858.671527]","[5.152945, 3.919945, 4.494711, 8.92276, 60.084368]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,qemu-startup,5,"['f284a38b-f6a0-4af8-a2e1-77982f8da90d', '6cd20851-258a-4dbb-8c63-3fe245907956', '075f1854-8fee-4dcd-9aa1-7f288399efbb', 'aced6db1-10a1-4e04-bd71-1e5fadde2767', '6e59ef96-22fa-41c3-baf3-b8ecaf4e9291']","['qemu-startup__qrSKYPB', 'qemu-startup__aaMgVxQ', 'qemu-startup__gLeUmPG', 'qemu-startup__K5NCYzq', 'qemu-startup__BGYuCBV']",1,"[906.872479, 908.882791, 136.411497, 471.67324, 900.013156]","[171.861712, 8.21656, 10.943761, 3.773959, 6.670596]",0.2,False,['075f1854-8fee-4dcd-9aa1-7f288399efbb'] +zai-org/GLM-4.5-Air-FP8,regex-log,5,"['911b0fa0-b953-46ba-b240-c98cdb1e7c56', '21daf928-d0ec-4df8-b867-b5c1e28357ff', 'a2f0f358-ecd2-4984-bb18-f682b13b2a26', '845efb28-c26a-40e9-9ee5-1c658d898fa4', 
'd13f8495-2b48-4b15-8658-f186ceb675a4']","['regex-log__9igK3W6', 'regex-log__hFyNhbR', 'regex-log__w8N7aTB', 'regex-log__Z9aR4Nj', 'regex-log__M4Urv3Y']",1,"[330.257806, 163.981409, 271.495067, 392.381113, 93.218095]","[115.229451, 117.252139, 77.549072, 83.872558, 154.883355]",0.2,False,['845efb28-c26a-40e9-9ee5-1c658d898fa4'] +zai-org/GLM-4.5-Air-FP8,reshard-c4-data,5,"['190922b4-bc91-4467-aa14-ea3264e1a6b8', 'e7c99fd9-783f-459b-b8f0-ca5a1c8cbe0d', '6e59646a-cf75-4889-9f4e-8244174511ea', 'b95d03c8-a3bd-48c4-a1db-6fdfa7475cf3', '22699437-2c5d-41f4-8c26-e5a4d135c7a1']","['reshard-c4-data__hEeetmm', 'reshard-c4-data__uE6zt44', 'reshard-c4-data__FucG4Ci', 'reshard-c4-data__xF2SEZW', 'reshard-c4-data__E6NS3kB']",0,"[268.393214, 657.352434, 310.582633, 325.148476, 900.021343]","[37.426851, 35.019194, 263.377935, 86.689513, 51.317291]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,reverse-engineering,5,"['a865970a-4067-4a13-baa9-2a2f3f56922e', '3c46035e-92a3-47ac-ba2e-17387b46af4a', '90878e4b-cb20-4e13-a9b3-9fa20111a1c7', '0148ddbb-9c20-4c80-bd8a-fef94dd3bb3f', 'cb876c41-2dab-45b9-8c43-39d015a984bc']","['reverse-engineering__K2FKpZQ', 'reverse-engineering__oFKpdaw', 'reverse-engineering__3SbkAxu', 'reverse-engineering__h8vsve8', 'reverse-engineering__AGwpuVU']",0,"[1828.789441, 1815.027932, 1820.35783, 1800.102118, 2104.729972]","[45.51991, 54.644235, 92.269084, 148.953238, 13.414089]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,run-pdp11-code,5,"['61c109e3-c374-4ca8-b6a2-8aa3fdb52db8', '55b56911-006c-4204-8ee1-ebb73044ccca', '3558e4b0-365e-4230-b6a7-f0a6c0ccc2ec', 'c6adf3d9-f323-481f-a15f-75adf828209b', '2285b1a1-3b56-4727-a8c2-5bb7cea85005']","['run-pdp11-code__w4BvkJ4', 'run-pdp11-code__nG53hUr', 'run-pdp11-code__JMr4Jvh', 'run-pdp11-code__EtPWZbs', 'run-pdp11-code__3w7WmeW']",0,"[1001.108505, 46.218415, 1065.2798, 555.972537, 644.675568]","[67.333553, 48.463113, 268.778864, 101.476695, 12.812456]",0.0,False,[] 
+zai-org/GLM-4.5-Air-FP8,sanitize-git-repo,5,"['c5a38b9b-a3d9-49c3-b015-7882f2476bdf', 'a39fa129-34d9-4c90-b6da-8f3ea4f94b0f', 'd45e9d1a-a50f-49a1-9c67-c9bcfc90a003', '612f0235-3d20-4445-8049-029a38755416', '49d38b2b-5e4b-4efe-9838-67ac611ec8b5']","['sanitize-git-repo__hokBaza', 'sanitize-git-repo__Z8NjD2z', 'sanitize-git-repo__zARXUzp', 'sanitize-git-repo__cHJfzKV', 'sanitize-git-repo__cACGrfa']",0,"[549.336437, 468.935086, 379.461879, 278.406908, 496.186615]","[286.882374, 23.006549, 80.925295, 14.899543, 32.18624]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,schemelike-metacircular-eval,5,"['c83a3078-238e-480c-bb8c-564027231f39', 'b776f559-18fb-4c91-ab52-06d2231e58dc', '810031f6-3b2c-4382-ba5c-ff8e8d490ca1', 'b902b60d-2196-4af3-885d-3eb23731e073', '0c8edb4d-8499-42d7-9ed9-3afa993aad58']","['schemelike-metacircular-eval__kbraigB', 'schemelike-metacircular-eval__pMg9jmC', 'schemelike-metacircular-eval__D3Jshho', 'schemelike-metacircular-eval__kzvajZZ', 'schemelike-metacircular-eval__viKmMRk']",0,"[2412.515906, 905.561927, 2430.088674, 1214.766976, 2428.692674]","[46.896665, 41.149266, 92.502563, 14.334732, 13.576862]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,sparql-university,5,"['52a24d4b-ba84-4f45-b2b7-b5b4c758e82a', '87d3e970-3208-439e-844d-357a468e3946', '128e17b3-ec1f-4a61-836f-488b1390eec0', '63680ddc-5269-4de2-a3b7-edd9d8395acd', '5d0d3b90-773b-4b46-9f05-649c93b194b1']","['sparql-university__36bzvzA', 'sparql-university__GHYZUnq', 'sparql-university__usnb3vk', 'sparql-university__kpd7aZk', 'sparql-university__7pozado']",0,"[220.562767, 146.77914, 265.402405, 152.513995, 560.913123]","[32.200953, 52.335389, 19.995107, 55.032034, 350.865809]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,sqlite-db-truncate,5,"['020e26d5-5dd5-4e82-b247-f6d67bc995e6', '8644ac58-6bd4-4dbf-a75d-043cb36770ac', 'ff59fa90-6cf3-4473-a07f-9d78e7f802dc', 'ddca5d2e-c708-42f5-a5a9-b519c17c7fe8', 'ea9fd1bb-f02d-4638-a0df-dd7b6012b96d']","['sqlite-db-truncate__vVta5x3', 'sqlite-db-truncate__dNwXyWe', 
'sqlite-db-truncate__vMyKCTF', 'sqlite-db-truncate__xYoJmnX', 'sqlite-db-truncate__RkSBZjD']",0,"[99.004713, 198.093197, 686.913767, 277.203435, 485.715557]","[15.211979, 12.96752, 45.32392, 106.226731, 70.096457]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,sqlite-with-gcov,5,"['a0813987-5035-4d27-a162-59491d1d7e73', '25aa4e25-852a-4e78-8936-a9ed8d107b26', '46b54077-f5eb-4df0-9539-85367512ebe8', '242d06d7-714c-4f0b-8b18-aea9c13ffaf7', '46815717-e762-4fac-9c27-cb64ac1e78a0']","['sqlite-with-gcov__NBWtSDN', 'sqlite-with-gcov__gRR2xLe', 'sqlite-with-gcov__xDjX6RW', 'sqlite-with-gcov__CQ5q6PQ', 'sqlite-with-gcov__rqErVfr']",3,"[168.923934, 692.336752, 198.423864, 674.239474, 508.10642]","[53.320608, 42.226668, 23.15191, 39.349937, 33.772471]",0.6,True,"['a0813987-5035-4d27-a162-59491d1d7e73', '25aa4e25-852a-4e78-8936-a9ed8d107b26', '46b54077-f5eb-4df0-9539-85367512ebe8']" +zai-org/GLM-4.5-Air-FP8,torch-tensor-parallelism,5,"['f0a06e59-3ed2-46db-a1c1-f4ea6e1ddd4f', '43ea0245-e4c0-41a9-a3d2-91200c59460c', '3ab4d380-e5db-4593-8bb0-3fe373d180a2', 'eadc8fa7-6d3a-4c79-8a75-f653350965df', 'e6a01123-7302-40c0-bdf7-ef2ae4b34ae9']","['torch-tensor-parallelism__bCYLfAS', 'torch-tensor-parallelism__eiUgefw', 'torch-tensor-parallelism__cxPddPX', 'torch-tensor-parallelism__Cw3mVQn', 'torch-tensor-parallelism__gZugTZS']",0,"[904.424344, 254.077497, 26.359132, 14.284388, 102.288619]","[213.792512, 70.048423, 22.733026, 13.995705, 85.633226]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,train-fasttext,5,"['d3482749-e71e-4ef4-bf2d-31898f7ce488', '600c9d42-84e0-479e-bcea-f8dd1e735257', '4972d768-75e8-4e91-ab75-f65fe5b0eb43', '0549246a-7425-4526-8c38-60f97574c8d9', '1e9848b6-6cbf-47d0-b688-b3cd14b4b65b']","['train-fasttext__hWmmPxN', 'train-fasttext__zkbeTy4', 'train-fasttext__MAEbb9w', 'train-fasttext__62q4qZg', 'train-fasttext__aRQQvVZ']",1,"[3600.002575, 2748.916437, 2870.975858, 3605.987934, 3625.402805]","[39.805922, 32.485182, 239.750791, 164.388832, 
44.577294]",0.2,False,['4972d768-75e8-4e91-ab75-f65fe5b0eb43'] +zai-org/GLM-4.5-Air-FP8,tune-mjcf,5,"['add15559-6664-4fe8-a788-73a20ebdbef3', '06c76a95-74e3-4d5c-adb3-81dcd76bca94', '5b739d6d-1a5d-496b-aafe-cc66ef911032', 'c2e7a50c-ca6c-4f41-8c44-8e27cb13b82c', 'f2794c28-0dd2-46b6-80e7-93ca8845989b']","['tune-mjcf__dUBqzX6', 'tune-mjcf__UnvDwND', 'tune-mjcf__ZqB9Lnw', 'tune-mjcf__aPtaWdK', 'tune-mjcf__sed48w5']",0,"[1041.461925, 1006.430859, 900.470388, 908.918819, 903.518]","[99.236811, 23.931194, 8.477091, 30.350851, 25.028757]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,video-processing,5,"['5d0ac4c3-8c0f-489f-ab07-d061377af674', '6ca070b1-3979-4e06-ad4c-03d2614ce63e', 'e3847b5a-5852-4d7b-9afa-1284763c6f05', '559b97d7-851a-49d4-808b-5b4fa4a20bfa', '7ad798f8-fb44-4af6-bd6d-e7d87a048706']","['video-processing__KppAAYh', 'video-processing__ALKWRtL', 'video-processing__5KC6EGz', 'video-processing__jnTtgeb', 'video-processing__Joz6dWa']",0,"[191.889484, 527.88485, 161.489294, 234.021947, 273.544293]","[17.38842, 69.007088, 86.240516, 28.871944, 83.007525]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,vulnerable-secret,5,"['eeab8b70-db97-416b-ac6b-41fc31c0f0d1', '3e69bdec-98d9-4b7c-9a5c-a88eef5d2fe1', '8ba1e39b-cbed-4f33-857a-86380ab4fb7e', '22f4265a-71d9-4535-afe9-34615065d4ab', '8619b2de-26fe-47ed-9f7c-df0395e5ed1a']","['vulnerable-secret__V9B4LYf', 'vulnerable-secret__GGTELaJ', 'vulnerable-secret__gzDfHzx', 'vulnerable-secret__Bz3hd7A', 'vulnerable-secret__DsyQeNx']",0,"[907.118781, 912.382655, 900.134525, 906.501625, 935.518186]","[11.044046, 34.876948, 14.010159, 81.282046, 25.832637]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,wasm-pipeline,5,"['7412edec-d8f6-4226-9342-f5053ebcb1a4', '0358c863-4758-404c-a034-94d684264187', 'd2458b21-a700-4b66-929c-faf70a4307fe', '2f48f6d3-9a5c-4470-bcc6-965701171f94', 'c7cad823-9eff-4326-be3c-765f4cc43bd8']","['wasm-pipeline__L6akytZ', 'wasm-pipeline__DSckHND', 'wasm-pipeline__GxCAqT2', 'wasm-pipeline__iZqxhgu', 
'wasm-pipeline__QTByGeE']",1,"[124.992499, 1033.663767, 366.979884, 901.235036, 508.230362]","[24.605003, 47.653542, 10.669574, 5.423698, 3.663403]",0.2,False,['d2458b21-a700-4b66-929c-faf70a4307fe'] +zai-org/GLM-4.5-Air-FP8,winning-avg-corewars,5,"['dd474613-0f9d-4aa0-984a-667e63e3b148', '2ee959fe-3642-4857-99f6-1c5007862703', 'fa474802-3795-42c2-8752-b0f71a729c48', '2126039e-fb03-4bdc-b5fb-bb77d6cbfe77', '2bc6222f-959d-4abe-85ab-92eae12560b4']","['winning-avg-corewars__NiRM2Gy', 'winning-avg-corewars__FWoBpoy', 'winning-avg-corewars__4CP9CL3', 'winning-avg-corewars__MgXTUFj', 'winning-avg-corewars__LHYPbK5']",0,"[1501.310929, 3606.37442, 972.475061, 372.466426, 1660.27635]","[55.433166, 10.733242, 60.576597, 21.850351, 10.939742]",0.0,False,[] +zai-org/GLM-4.5-Air-FP8,write-compressor,5,"['6fe5b1bf-fdf7-4e7b-bc91-671c8b2cdb4a', '14febac8-9296-4e61-9de1-0191f1e780bd', '73134e5c-f967-4229-80a9-1c8da840cbec', '9d4f126a-1f1d-4a75-8c9d-a0ac12c9b84b', 'dd4f3027-2b94-401c-814f-e33efb8c1fc9']","['write-compressor__uxzzit7', 'write-compressor__cdis8t5', 'write-compressor__xFdngdV', 'write-compressor__GRQ9bPL', 'write-compressor__hoyaMu4']",0,"[902.319958, 909.351836, 900.281979, 1033.294118, 831.477683]","[66.406618, 78.634018, 18.540349, 683.18249, 24.89933]",0.0,False,[] diff --git a/notebooks/difficulty_analysis_pipeline/results/task_difficulty.csv b/notebooks/difficulty_analysis_pipeline/results/task_difficulty.csv new file mode 100644 index 0000000..e740938 --- /dev/null +++ b/notebooks/difficulty_analysis_pipeline/results/task_difficulty.csv @@ -0,0 +1,75 @@ +task_name,model_resolve_rate,model_difficulty,human_difficulty,total_models_tested,models_that_resolve,resolving_models,non_resolving_models +adaptive-rejection-sampler,0.0,hard,medium,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 
'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +bn-fit-modify,0.25,hard,hard,16,4,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'gpt-5-mini', 'grok-4-0709']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-nano', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +break-filter-js-from-html,0.0,hard,medium,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +build-cython-ext,0.0,hard,medium,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +build-initramfs-qemu,0.0,hard,medium,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" 
+build-pmars,0.5625,medium,medium,16,9,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'grok-code-fast-1', 'moonshotai/Kimi-K2-Instruct-0905', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'claude-opus-4-1-20250805', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'openai/gpt-oss-120b']" +build-pov-ray,0.3125,hard,medium,16,5,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'gemini-2.5-pro', 'grok-4-0709', 'moonshotai/Kimi-K2-Instruct-0905']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +cancel-async-tasks,0.375,medium,hard,16,6,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-sonnet-4-20250514', 'gpt-5', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b']","['OpenAI/gpt-oss-20B', 'claude-opus-4-1-20250805', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'zai-org/GLM-4.5-Air-FP8']" +chess-best-move,0.0,hard,medium,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +circuit-fibsqrt,0.0625,hard,hard,16,1,['gpt-5'],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 
'gemini-2.5-pro', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +cobol-modernization,0.5625,medium,hard,16,9,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'grok-code-fast-1', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'gemini-2.5-flash', 'gpt-5-nano', 'grok-4-0709', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'zai-org/GLM-4.5-Air-FP8']" +code-from-image,0.1875,hard,medium,16,3,"['deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-pro', 'moonshotai/Kimi-K2-Instruct-0905']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'gemini-2.5-flash', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +configure-git-webserver,0.5625,medium,hard,16,9,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gpt-5', 'gpt-5-mini', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b']","['OpenAI/gpt-oss-20B', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'zai-org/GLM-4.5-Air-FP8']" +constraints-scheduling,0.75,easy,medium,16,12,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'grok-4-0709', 'grok-code-fast-1', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'gemini-2.5-flash', 'gpt-5-nano', 
'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8']" +count-dataset-tokens,0.0,hard,medium,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +crack-7z-hash,0.5,medium,medium,16,8,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'grok-4-0709', 'grok-code-fast-1', 'moonshotai/Kimi-K2-Instruct-0905']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +db-wal-recovery,0.0,hard,medium,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +distribution-search,0.3125,hard,medium,16,5,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +dna-assembly,0.0,hard,hard,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 
'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +dna-insert,0.0,hard,medium,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +extract-elf,0.375,medium,medium,16,6,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'deepseek-ai/DeepSeek-V3.1', 'gpt-5-mini', 'grok-code-fast-1', 'moonshotai/Kimi-K2-Instruct-0905']","['OpenAI/gpt-oss-20B', 'claude-sonnet-4-20250514', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-nano', 'grok-4-0709', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +feal-differential-cryptanalysis,0.125,hard,hard,16,2,"['gemini-2.5-pro', 'grok-4-0709']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +feal-linear-cryptanalysis,0.0625,hard,hard,16,1,['gpt-5'],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 
'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +filter-js-from-html,0.0,hard,medium,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +financial-document-processor,0.0,hard,medium,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +fix-code-vulnerability,0.0625,hard,hard,16,1,['claude-sonnet-4-20250514'],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +fix-git,0.75,easy,medium,16,12,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'grok-4-0709', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'gpt-5-nano', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8']" +fix-ocaml-gc,0.0,hard,hard,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 
'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +form-filling,0.6875,easy,medium,16,11,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-code-fast-1', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'gemini-2.5-flash', 'gemini-2.5-pro', 'grok-4-0709', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8']" +git-leak-recovery,0.625,medium,medium,16,10,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'openai/gpt-oss-120b']" +gpt2-codegolf,0.0,hard,hard,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +hf-model-inference,0.5,medium,medium,16,8,"['deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'grok-4-0709', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 
'claude-sonnet-4-20250514', 'gpt-5-nano', 'grok-code-fast-1', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b']" +install-klee-minimal,0.0,hard,medium,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +install-windows-3.11,0.0,hard,hard,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +large-scale-text-editing,0.125,hard,medium,16,2,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +largest-eigenval,0.0,hard,medium,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" 
+log-summary-date-ranges,0.3125,hard,medium,16,5,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'moonshotai/Kimi-K2-Instruct-0905', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'openai/gpt-oss-120b']" +make-doom-for-mips,0.0,hard,hard,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +make-mips-interpreter,0.0,hard,hard,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +merge-diff-arc-agi-task,0.1875,hard,medium,16,3,"['gemini-2.5-pro', 'gpt-5', 'grok-code-fast-1']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +model-extraction-relu-logits,0.0,hard,hard,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 
'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +mteb-leaderboard,0.0,hard,medium,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +mteb-retrieve,0.0,hard,medium,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +nginx-request-logging,0.375,medium,medium,16,6,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'gemini-2.5-pro', 'gpt-5', 'grok-4-0709', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gpt-5-mini', 'gpt-5-nano', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b']" +openssl-selfsigned-cert,0.5625,medium,medium,16,9,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'gemini-2.5-flash', 'grok-4-0709', 'grok-code-fast-1', 
'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'zai-org/GLM-4.5-Air-FP8']" +password-recovery,0.0625,hard,hard,16,1,['claude-opus-4-1-20250805'],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +path-tracing,0.0,hard,hard,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +path-tracing-reverse,0.0,hard,hard,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +polyglot-c-py,0.0625,hard,medium,16,1,['grok-4-0709'],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +polyglot-rust-c,0.0,hard,hard,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 
'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +port-compressor,0.0,hard,hard,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +prove-plus-comm,0.6875,easy,medium,16,11,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'grok-4-0709', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'gpt-5-nano', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8']" +pypi-server,0.375,medium,medium,16,6,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'gemini-2.5-pro', 'gpt-5-mini', 'gpt-5-nano', 'grok-code-fast-1']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gpt-5', 'grok-4-0709', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +pytorch-model-cli,0.0625,hard,medium,16,1,['grok-4-0709'],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 
'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +pytorch-model-recovery,0.375,medium,medium,16,6,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-pro', 'grok-code-fast-1']","['OpenAI/gpt-oss-20B', 'gemini-2.5-flash', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +qemu-alpine-ssh,0.125,hard,medium,16,2,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +qemu-startup,0.125,hard,medium,16,2,"['gpt-5', 'gpt-5-mini']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +regex-log,0.4375,medium,medium,16,7,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'grok-4-0709']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'deepseek-ai/DeepSeek-V3.1', 'gpt-5-nano', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +reshard-c4-data,0.0,hard,medium,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 
'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +reverse-engineering,0.0625,hard,hard,16,1,['gpt-5'],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +run-pdp11-code,0.0,hard,hard,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +sanitize-git-repo,0.0,hard,medium,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +schemelike-metacircular-eval,0.0,hard,medium,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 
'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +sparql-university,0.125,hard,hard,16,2,"['gemini-2.5-pro', 'gpt-5']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +sqlite-db-truncate,0.0,hard,medium,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +sqlite-with-gcov,0.5,medium,medium,16,8,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-pro', 'gpt-5-mini', 'gpt-5-nano', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'claude-sonnet-4-20250514', 'gemini-2.5-flash', 'gpt-5', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905']" +torch-tensor-parallelism,0.0,hard,hard,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +train-fasttext,0.0,hard,hard,16,0,[],"['OpenAI/gpt-oss-20B', 
'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +tune-mjcf,0.0625,hard,medium,16,1,['gemini-2.5-flash'],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +video-processing,0.0,hard,hard,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +vulnerable-secret,0.25,hard,medium,16,4,"['claude-opus-4-1-20250805', 'gemini-2.5-pro', 'grok-4-0709', 'grok-code-fast-1']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +wasm-pipeline,0.25,hard,medium,16,4,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-sonnet-4-20250514', 'gpt-5', 'gpt-5-mini']","['OpenAI/gpt-oss-20B', 'claude-opus-4-1-20250805', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5-nano', 'grok-4-0709', 
'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +winning-avg-corewars,0.0,hard,medium,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" +write-compressor,0.0,hard,hard,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']" diff --git a/notebooks/difficulty_analysis_pipeline/results/task_resolution.csv b/notebooks/difficulty_analysis_pipeline/results/task_resolution.csv new file mode 100644 index 0000000..06695cc --- /dev/null +++ b/notebooks/difficulty_analysis_pipeline/results/task_resolution.csv @@ -0,0 +1,75 @@ +task_name,total_models_tested,models_that_resolve,resolving_models,non_resolving_models,model_resolve_rate +adaptive-rejection-sampler,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +bn-fit-modify,16,4,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'gpt-5-mini', 
'grok-4-0709']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-nano', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.25 +break-filter-js-from-html,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +build-cython-ext,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +build-initramfs-qemu,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +build-pmars,16,9,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'grok-code-fast-1', 'moonshotai/Kimi-K2-Instruct-0905', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'claude-opus-4-1-20250805', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 
'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'openai/gpt-oss-120b']",0.5625 +build-pov-ray,16,5,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'gemini-2.5-pro', 'grok-4-0709', 'moonshotai/Kimi-K2-Instruct-0905']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.3125 +cancel-async-tasks,16,6,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-sonnet-4-20250514', 'gpt-5', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b']","['OpenAI/gpt-oss-20B', 'claude-opus-4-1-20250805', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'zai-org/GLM-4.5-Air-FP8']",0.375 +chess-best-move,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +circuit-fibsqrt,16,1,['gpt-5'],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0625 +cobol-modernization,16,9,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'grok-code-fast-1', 
'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'gemini-2.5-flash', 'gpt-5-nano', 'grok-4-0709', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'zai-org/GLM-4.5-Air-FP8']",0.5625 +code-from-image,16,3,"['deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-pro', 'moonshotai/Kimi-K2-Instruct-0905']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'gemini-2.5-flash', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.1875 +configure-git-webserver,16,9,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gpt-5', 'gpt-5-mini', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b']","['OpenAI/gpt-oss-20B', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'zai-org/GLM-4.5-Air-FP8']",0.5625 +constraints-scheduling,16,12,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'grok-4-0709', 'grok-code-fast-1', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'gemini-2.5-flash', 'gpt-5-nano', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8']",0.75 +count-dataset-tokens,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 
'zai-org/GLM-4.5-Air-FP8']",0.0 +crack-7z-hash,16,8,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'grok-4-0709', 'grok-code-fast-1', 'moonshotai/Kimi-K2-Instruct-0905']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.5 +db-wal-recovery,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +distribution-search,16,5,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.3125 +dna-assembly,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +dna-insert,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 
'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +extract-elf,16,6,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'deepseek-ai/DeepSeek-V3.1', 'gpt-5-mini', 'grok-code-fast-1', 'moonshotai/Kimi-K2-Instruct-0905']","['OpenAI/gpt-oss-20B', 'claude-sonnet-4-20250514', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-nano', 'grok-4-0709', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.375 +feal-differential-cryptanalysis,16,2,"['gemini-2.5-pro', 'grok-4-0709']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.125 +feal-linear-cryptanalysis,16,1,['gpt-5'],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0625 +filter-js-from-html,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 
+financial-document-processor,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +fix-code-vulnerability,16,1,['claude-sonnet-4-20250514'],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0625 +fix-git,16,12,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'grok-4-0709', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'gpt-5-nano', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8']",0.75 +fix-ocaml-gc,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +form-filling,16,11,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-code-fast-1', 'moonshotai/Kimi-K2-Instruct-0905', 
'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'gemini-2.5-flash', 'gemini-2.5-pro', 'grok-4-0709', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8']",0.6875 +git-leak-recovery,16,10,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'openai/gpt-oss-120b']",0.625 +gpt2-codegolf,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +hf-model-inference,16,8,"['deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'grok-4-0709', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'gpt-5-nano', 'grok-code-fast-1', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b']",0.5 +install-klee-minimal,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +install-windows-3.11,16,0,[],"['OpenAI/gpt-oss-20B', 
'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +large-scale-text-editing,16,2,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.125 +largest-eigenval,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +log-summary-date-ranges,16,5,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'moonshotai/Kimi-K2-Instruct-0905', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'openai/gpt-oss-120b']",0.3125 +make-doom-for-mips,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 
'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +make-mips-interpreter,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +merge-diff-arc-agi-task,16,3,"['gemini-2.5-pro', 'gpt-5', 'grok-code-fast-1']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.1875 +model-extraction-relu-logits,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +mteb-leaderboard,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +mteb-retrieve,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 
'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +nginx-request-logging,16,6,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'gemini-2.5-pro', 'gpt-5', 'grok-4-0709', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gpt-5-mini', 'gpt-5-nano', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b']",0.375 +openssl-selfsigned-cert,16,9,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'gemini-2.5-flash', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'zai-org/GLM-4.5-Air-FP8']",0.5625 +password-recovery,16,1,['claude-opus-4-1-20250805'],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0625 +path-tracing,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 
'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +path-tracing-reverse,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +polyglot-c-py,16,1,['grok-4-0709'],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0625 +polyglot-rust-c,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +port-compressor,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +prove-plus-comm,16,11,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 
'grok-4-0709', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'gpt-5-nano', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8']",0.6875 +pypi-server,16,6,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'gemini-2.5-pro', 'gpt-5-mini', 'gpt-5-nano', 'grok-code-fast-1']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gpt-5', 'grok-4-0709', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.375 +pytorch-model-cli,16,1,['grok-4-0709'],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0625 +pytorch-model-recovery,16,6,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-pro', 'grok-code-fast-1']","['OpenAI/gpt-oss-20B', 'gemini-2.5-flash', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.375 +qemu-alpine-ssh,16,2,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.125 
+qemu-startup,16,2,"['gpt-5', 'gpt-5-mini']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.125 +regex-log,16,7,"['claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'grok-4-0709']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'deepseek-ai/DeepSeek-V3.1', 'gpt-5-nano', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.4375 +reshard-c4-data,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +reverse-engineering,16,1,['gpt-5'],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0625 +run-pdp11-code,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 
'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +sanitize-git-repo,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +schemelike-metacircular-eval,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +sparql-university,16,2,"['gemini-2.5-pro', 'gpt-5']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.125 +sqlite-db-truncate,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +sqlite-with-gcov,16,8,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 
'claude-opus-4-1-20250805', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-pro', 'gpt-5-mini', 'gpt-5-nano', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']","['OpenAI/gpt-oss-20B', 'claude-sonnet-4-20250514', 'gemini-2.5-flash', 'gpt-5', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905']",0.5 +torch-tensor-parallelism,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +train-fasttext,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +tune-mjcf,16,1,['gemini-2.5-flash'],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0625 +video-processing,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 
'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +vulnerable-secret,16,4,"['claude-opus-4-1-20250805', 'gemini-2.5-pro', 'grok-4-0709', 'grok-code-fast-1']","['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.25 +wasm-pipeline,16,4,"['Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-sonnet-4-20250514', 'gpt-5', 'gpt-5-mini']","['OpenAI/gpt-oss-20B', 'claude-opus-4-1-20250805', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.25 +winning-avg-corewars,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 +write-compressor,16,0,[],"['OpenAI/gpt-oss-20B', 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8', 'claude-opus-4-1-20250805', 'claude-sonnet-4-20250514', 'deepseek-ai/DeepSeek-V3.1', 'gemini-2.5-flash', 'gemini-2.5-pro', 'gpt-5', 'gpt-5-mini', 'gpt-5-nano', 'grok-4-0709', 'grok-code-fast-1', 'meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'moonshotai/Kimi-K2-Instruct-0905', 'openai/gpt-oss-120b', 'zai-org/GLM-4.5-Air-FP8']",0.0 diff --git a/notebooks/output_token_analysis_pipeline/output_token_analysis.ipynb 
b/notebooks/output_token_analysis_pipeline/output_token_analysis.ipynb new file mode 100644 index 0000000..82ba1c8 --- /dev/null +++ b/notebooks/output_token_analysis_pipeline/output_token_analysis.ipynb @@ -0,0 +1,314 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Model Success vs. Avg Output Tokens\n", + "\n", + "1. **Extracts token usage** from result.json files in trial directories\n", + "2. **Combines with performance data** from difficulty analysis pipeline \n", + "3. **Analyzes token efficiency** - tokens per success, output tokens vs success rates\n", + "4. **Creates visualizations** showing relationships between token usage and performance\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd\n", + "import numpy as np\n", + "import matplotlib.pyplot as plt\n", + "import json\n", + "from pathlib import Path\n", + "from datetime import datetime\n", + "import ast\n", + "from scipy import stats\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def extract_token_usage():\n", + " # TODO: Set path to your terminus2 data directory (output from get_terminus2_runs.py)\n", + " base_dir = Path(\"../../../../terminus2_9-17_essential_files\")\n", + " token_data = []\n", + " \n", + " for trial_dir in base_dir.iterdir():\n", + " if not trial_dir.is_dir():\n", + " continue\n", + " \n", + " result_file = trial_dir / \"result.json\"\n", + " if not result_file.exists():\n", + " continue\n", + " \n", + " try:\n", + " with open(result_file, 'r') as f:\n", + " result = json.load(f)\n", + " \n", + " trial_id = result.get('id')\n", + " model_name = result.get('agent_info', {}).get('model_info', {}).get('name')\n", + " task_name = result.get('task_name')\n", + " \n", + " verifier_result = result.get('verifier_result') or {}\n", + " reward = verifier_result.get('reward', 0) if 
isinstance(verifier_result, dict) else 0\n", + " \n", + " # Token data is in agent_result, not agent_execution\n", + " agent_result = result.get('agent_result', {})\n", + " if not agent_result:\n", + " continue\n", + " \n", + " input_tokens = agent_result.get('n_input_tokens', 0)\n", + " output_tokens = agent_result.get('n_output_tokens', 0)\n", + " \n", + " # Execution time is in agent_execution\n", + " agent_execution = result.get('agent_execution', {})\n", + " started_at = agent_execution.get('started_at')\n", + " finished_at = agent_execution.get('finished_at')\n", + " \n", + " execution_time = None\n", + " if started_at and finished_at:\n", + " start_dt = datetime.fromisoformat(started_at.replace('Z', '+00:00'))\n", + " end_dt = datetime.fromisoformat(finished_at.replace('Z', '+00:00'))\n", + " execution_time = (end_dt - start_dt).total_seconds()\n", + " \n", + " token_data.append({\n", + " 'trial_id': trial_id,\n", + " 'model_name': model_name,\n", + " 'task_name': task_name,\n", + " 'reward': reward,\n", + " 'success': reward > 0,\n", + " 'n_input_tokens': input_tokens,\n", + " 'n_output_tokens': output_tokens,\n", + " 'total_tokens': input_tokens + output_tokens,\n", + " 'execution_time_sec': execution_time\n", + " })\n", + " \n", + " except:\n", + " continue\n", + " \n", + " return pd.DataFrame(token_data)\n", + "\n", + "token_df = extract_token_usage()\n", + "print(f\"Extracted token data from {len(token_df)} trials\")\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def extract_provider_from_model(model_name):\n", + " if 'claude' in model_name.lower():\n", + " return 'Anthropic'\n", + " elif 'gpt' in model_name.lower() or 'openai' in model_name.lower():\n", + " return 'OpenAI'\n", + " elif 'gemini' in model_name.lower():\n", + " return 'Google'\n", + " elif 'deepseek' in model_name.lower():\n", + " return 'DeepSeek'\n", + " elif 'kimi' in model_name.lower() or 'moonshot' in 
model_name.lower():\n", + " return 'Moonshot'\n", + " elif 'qwen' in model_name.lower():\n", + " return 'Alibaba'\n", + " elif 'grok' in model_name.lower():\n", + " return 'xAI'\n", + " elif 'glm' in model_name.lower() or 'zai-org' in model_name.lower():\n", + " return 'Zhipu AI'\n", + " elif 'llama' in model_name.lower() or 'meta' in model_name.lower():\n", + " return 'Meta'\n", + " else:\n", + " return 'Other'\n", + "\n", + "def process_token_data(token_df):\n", + " model_summary = token_df.groupby('model_name').agg({\n", + " 'n_output_tokens': ['mean', 'std', 'sum'],\n", + " 'success': ['mean', 'count'],\n", + " 'execution_time_sec': 'mean'\n", + " }).round(3)\n", + " \n", + " model_summary.columns = [\n", + " 'avg_output_tokens', 'std_output_tokens', 'total_output_tokens',\n", + " 'success_rate', 'trial_count', 'avg_execution_time'\n", + " ]\n", + " \n", + " model_summary = model_summary[model_summary['trial_count'] >= 10].copy()\n", + " model_summary['provider'] = model_summary.index.map(extract_provider_from_model)\n", + " \n", + " return model_summary\n", + "\n", + "model_summary = process_token_data(token_df)\n", + "print(f\"Processed data for {len(model_summary)} models with >= 10 trials\")\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def simplify_model_name(model_name):\n", + " model_names = {\n", + " \"claude-sonnet-4-20250514\": \"Claude Sonnet 4\",\n", + " \"claude-opus-4-1-20250805\": \"Claude Opus 4.1\",\n", + " \"gpt-5\": \"GPT-5\",\n", + " \"gpt-5-mini\": \"GPT-5-Mini\",\n", + " \"gpt-5-nano\": \"GPT-5-Nano\",\n", + " \"grok-4-0709\": \"Grok 4\",\n", + " \"grok-code-fast-1\": \"Grok Code Fast 1\",\n", + " \"gemini-2.5-pro\": \"Gemini 2.5 Pro\",\n", + " \"gemini-2.5-flash\": \"Gemini 2.5 Flash\",\n", + " \"Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8\": \"Qwen 3 Coder 480B\",\n", + " \"openai/gpt-oss-120b\": \"GPT-OSS 120B\",\n", + " \"OpenAI/gpt-oss-20B\": \"GPT-OSS 20B\",\n", + " 
\"moonshotai/Kimi-K2-Instruct-0905\": \"Kimi K2\",\n", + " \"meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8\": \"Llama 4 Maverick 17B\",\n", + " \"zai-org/GLM-4.5-Air-FP8\": \"GLM 4.5 Air\",\n", + " \"deepseek-ai/DeepSeek-V3.1\": \"DeepSeek V3.1\",\n", + " }\n", + " return model_names.get(model_name, model_name)\n", + "\n", + "def create_token_success_plot(model_summary):\n", + " print(f\"Data summary:\")\n", + " print(f\"Models: {len(model_summary)}\")\n", + " print(f\"Output tokens range: {model_summary['avg_output_tokens'].min():.0f} - {model_summary['avg_output_tokens'].max():.0f}\")\n", + " print(f\"Success rate range: {model_summary['success_rate'].min():.3f} - {model_summary['success_rate'].max():.3f}\")\n", + " \n", + " # Check if we have enough variation in the data\n", + " if len(model_summary) < 2:\n", + " print(\"Not enough models for correlation analysis\")\n", + " return None, None\n", + " \n", + " if model_summary['avg_output_tokens'].std() == 0:\n", + " print(\"All models have same output tokens - no correlation possible\")\n", + " return None, None\n", + " \n", + " if model_summary['success_rate'].std() == 0:\n", + " print(\"All models have same success rate - no correlation possible\")\n", + " return None, None\n", + " \n", + " fig, ax = plt.subplots(figsize=(12, 8))\n", + " \n", + " provider_colors = {\n", + " 'OpenAI': '#d62728',\n", + " 'Anthropic': '#2ca02c', \n", + " 'Google': '#ff7f0e',\n", + " 'xAI': '#bcbd22',\n", + " 'DeepSeek': '#9467bd',\n", + " 'Meta': '#8c564b',\n", + " 'Moonshot': '#e377c2',\n", + " 'Alibaba': '#7f7f7f',\n", + " 'Zhipu AI': '#17becf',\n", + " 'Other': '#1f77b4'\n", + " }\n", + " \n", + " for provider in model_summary['provider'].unique():\n", + " provider_data = model_summary[model_summary['provider'] == provider]\n", + " ax.scatter(provider_data['avg_output_tokens'], provider_data['success_rate'],\n", + " c=provider_colors.get(provider, '#95A5A6'), \n", + " label=provider, s=100, alpha=0.7, edgecolors='black', 
linewidth=1)\n", + " \n", + " x = model_summary['avg_output_tokens']\n", + " y = model_summary['success_rate']\n", + " \n", + " # Try to calculate correlation and trend line with error handling\n", + " correlation, p_value = None, None\n", + " try:\n", + " correlation, p_value = stats.pearsonr(x, y)\n", + " \n", + " # Only add trend line if correlation is valid\n", + " if not np.isnan(correlation):\n", + " z = np.polyfit(x, y, 1)\n", + " p = np.poly1d(z)\n", + " ax.plot(x, p(x), \"r--\", alpha=0.8, linewidth=2, \n", + " label=f'Trend (r={correlation:.3f}, p={p_value:.3f})')\n", + " except:\n", + " print(\"Could not calculate correlation - data may be constant\")\n", + " \n", + " # Add model name labels\n", + " for _, row in model_summary.iterrows():\n", + " display_name = simplify_model_name(row['model_name'])\n", + " x_pos = row['avg_output_tokens']\n", + " y_pos = row['success_rate']\n", + " \n", + " ax.annotate(display_name, \n", + " (x_pos, y_pos),\n", + " xytext=(8, 0), textcoords='offset points',\n", + " fontsize=10, ha='left', va='center')\n", + " \n", + " ax.set_xlabel('Average Output Tokens', fontsize=12, fontweight='bold')\n", + " ax.set_ylabel('Success Rate', fontsize=12, fontweight='bold')\n", + " ax.set_title('Success Rate vs Output Tokens', fontsize=14, fontweight='bold')\n", + " \n", + " ax.grid(True, alpha=0.3)\n", + " ax.legend(bbox_to_anchor=(1.05, 1), loc='upper left')\n", + " \n", + " plt.tight_layout()\n", + " plt.savefig('results/success_vs_output_tokens.png', dpi=300, bbox_inches='tight')\n", + " plt.savefig('results/success_vs_output_tokens.pdf', dpi=300, bbox_inches='tight')\n", + " plt.show()\n", + " \n", + " return correlation, p_value\n", + "\n", + "Path(\"results\").mkdir(exist_ok=True)\n", + "correlation, p_value = create_token_success_plot(model_summary)\n", + "\n", + "if correlation is not None and p_value is not None:\n", + " print(f\"Correlation: {correlation:.3f}, p-value: {p_value:.3f}\")\n", + "else:\n", + " print(\"Could not 
calculate correlation statistics\")\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "model_summary.to_csv('results/model_token_summary.csv')\n", + "\n", + "provider_summary = model_summary.groupby('provider').agg({\n", + " 'avg_output_tokens': 'mean',\n", + " 'success_rate': 'mean',\n", + " 'trial_count': 'sum',\n", + " 'avg_execution_time': 'mean'\n", + "}).round(3)\n", + "\n", + "provider_summary.to_csv('results/provider_token_summary.csv')\n", + "\n", + "print(\"Saved files:\")\n", + "print(\"- model_token_summary.csv\")\n", + "print(\"- provider_token_summary.csv\")\n", + "print(\"- success_vs_output_tokens.png\")\n", + "print(\"- success_vs_output_tokens.pdf\")\n" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": ".venv", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.13.5" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/notebooks/output_token_analysis_pipeline/results/model_token_summary.csv b/notebooks/output_token_analysis_pipeline/results/model_token_summary.csv new file mode 100644 index 0000000..b2d70e2 --- /dev/null +++ b/notebooks/output_token_analysis_pipeline/results/model_token_summary.csv @@ -0,0 +1,17 @@ +model_name,avg_input_tokens,std_input_tokens,total_input_tokens,avg_output_tokens,std_output_tokens,total_output_tokens,avg_total_tokens,std_total_tokens,total_all_tokens,success_rate,trial_count,avg_execution_time +OpenAI/gpt-oss-20B,1959.043,2396.797,724846,5220.678,8570.833,1931651,7179.722,10685.421,2656497,0.022,370,458.837 +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,11984.381,10899.494,4470174,7690.15,7581.654,2868426,19674.531,17832.17,7338600,0.182,373,979.649 
+claude-opus-4-1-20250805,13187.472,12669.744,7661921,9154.542,11323.978,5318789,22342.014,23413.549,12980710,0.334,581,842.141 +claude-sonnet-4-20250514,11510.394,9870.181,4235825,7510.769,6605.042,2763963,19021.163,15748.775,6999788,0.293,368,900.255 +deepseek-ai/DeepSeek-V3.1,11719.862,9994.743,4324629,7578.585,7752.439,2796498,19298.447,17055.243,7121127,0.225,369,821.944 +gemini-2.5-flash,10588.9,13732.032,3928482,12355.544,19644.816,4583907,22944.445,31436.818,8512389,0.119,371,901.462 +gemini-2.5-pro,9311.374,8524.477,3435897,5760.295,7759.136,2125549,15071.669,15217.249,5561446,0.271,369,838.168 +gpt-5,8003.887,6814.275,3553726,7244.876,8833.919,3216725,15248.764,14628.443,6770451,0.342,444,866.216 +gpt-5-mini,8833.747,8853.105,3241985,8133.232,9927.629,2984896,16966.978,18224.314,6226881,0.204,367,913.615 +gpt-5-nano,10810.393,9850.716,3989035,10083.995,10144.839,3720994,20894.388,18896.734,7710029,0.089,369,1131.244 +grok-4-0709,6227.531,6359.392,2297959,3365.954,4466.984,1242037,9593.485,9996.991,3539996,0.206,369,1010.396 +grok-code-fast-1,5936.671,5185.559,2202505,3159.027,3099.79,1171999,9095.698,7714.732,3374504,0.132,371,456.191 +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,8508.352,11418.915,3139582,3762.491,3967.62,1388359,12270.843,14916.197,4527941,0.065,369,545.83 +moonshotai/Kimi-K2-Instruct-0905,12300.351,11064.253,4588031,8263.18,7526.13,3082166,20563.531,17891.589,7670197,0.214,373,955.649 +openai/gpt-oss-120b,6135.778,6044.209,2239559,4957.871,5707.363,1809623,11093.649,11082.198,4049182,0.148,365,613.336 +zai-org/GLM-4.5-Air-FP8,12541.348,11057.971,4652840,9326.097,8545.432,3459982,21867.445,18239.253,8112822,0.14,371,816.14 diff --git a/notebooks/output_token_analysis_pipeline/results/provider_token_summary.csv b/notebooks/output_token_analysis_pipeline/results/provider_token_summary.csv new file mode 100644 index 0000000..1f10725 --- /dev/null +++ b/notebooks/output_token_analysis_pipeline/results/provider_token_summary.csv @@ -0,0 
+1,6 @@ +provider,avg_input_tokens,std_input_tokens,total_input_tokens,avg_output_tokens,std_output_tokens,total_output_tokens,avg_total_tokens,std_total_tokens,total_all_tokens,success_rate,trial_count,avg_execution_time +anthropic,12537.14,11687.293,11897746,8517.125,9797.235,8082752,21054.266,20833.428,19980498,0.318,949,864.676 +gemini,9951.864,11445.801,7364379,9066.832,15299.979,6709456,19018.696,25012.671,14073835,0.195,740,869.901 +openai,9139.615,8570.574,10784746,8408.996,9667.135,9922615,17548.611,17336.838,20707361,0.22,1180,963.835 +together_ai,9320.332,10232.273,24139661,6693.708,7498.385,17336705,16014.041,16542.738,41476366,0.142,2590,742.471 +xai,6081.708,5798.554,4500464,3262.211,3841.62,2414036,9343.919,8923.447,6914500,0.169,740,732.544 diff --git a/notebooks/output_token_analysis_pipeline/results/success_vs_output_tokens.pdf b/notebooks/output_token_analysis_pipeline/results/success_vs_output_tokens.pdf new file mode 100644 index 0000000..683a9b6 Binary files /dev/null and b/notebooks/output_token_analysis_pipeline/results/success_vs_output_tokens.pdf differ diff --git a/notebooks/output_token_analysis_pipeline/results/success_vs_output_tokens.png b/notebooks/output_token_analysis_pipeline/results/success_vs_output_tokens.png new file mode 100644 index 0000000..5d38863 Binary files /dev/null and b/notebooks/output_token_analysis_pipeline/results/success_vs_output_tokens.png differ diff --git a/notebooks/output_token_analysis_pipeline/results/task_token_summary.csv b/notebooks/output_token_analysis_pipeline/results/task_token_summary.csv new file mode 100644 index 0000000..db8ff03 --- /dev/null +++ b/notebooks/output_token_analysis_pipeline/results/task_token_summary.csv @@ -0,0 +1,75 @@ +task_name,avg_input_tokens,std_input_tokens,avg_output_tokens,std_output_tokens,avg_total_tokens,std_total_tokens,success_rate,trial_count,avg_execution_time +adaptive-rejection-sampler,9183.542,4161.453,9002.217,6385.061,18185.759,8863.874,0.108,83,786.444 
+bn-fit-modify,16394.512,9810.175,10845.262,10007.526,27239.774,17812.782,0.25,84,1365.082 +break-filter-js-from-html,5584.151,4607.83,6056.419,5223.179,11640.57,9687.021,0.07,86,755.555 +build-cython-ext,13551.88,5635.135,5448.361,3209.982,19000.241,7075.307,0.012,83,823.956 +build-initramfs-qemu,5783.676,5510.737,3841.704,2557.165,9625.38,7586.706,0.0,71,544.652 +build-pmars,11535.771,5312.788,4704.012,3067.487,16239.783,7155.221,0.542,83,693.679 +build-pov-ray,18762.843,12833.725,12542.386,14637.326,31305.229,24471.355,0.337,83,2252.415 +cancel-async-tasks,2487.867,3347.51,2072.831,4236.314,4560.699,7544.181,0.361,83,254.164 +chess-best-move,9706.635,5482.424,6159.624,3890.598,15866.259,8505.186,0.0,85,594.471 +circuit-fibsqrt,18915.75,15887.294,25325.964,24673.44,44241.714,37781.875,0.048,84,2135.446 +cobol-modernization,7867.738,4619.624,6694.202,4893.023,14561.94,9169.413,0.583,84,647.164 +code-from-image,10601.169,8219.201,7749.578,7280.605,18350.747,15076.218,0.253,83,672.54 +configure-git-webserver,6045.548,2346.025,2217.464,1267.782,8263.012,3304.735,0.429,84,451.294 +constraints-scheduling,5642.291,3488.338,4705.779,3524.522,10348.07,6835.655,0.721,86,401.496 +count-dataset-tokens,10404.905,4383.928,4288.738,2088.391,14693.643,5053.81,0.024,84,682.087 +crack-7z-hash,8804.36,4710.155,3713.791,2089.385,12518.151,6393.88,0.465,86,468.707 +db-wal-recovery,5439.593,4088.903,5554.244,3603.438,10993.837,6780.914,0.023,86,612.106 +distribution-search,12052.588,11126.675,12885.788,13799.708,24938.376,24538.476,0.341,85,1104.883 +dna-assembly,10145.548,6232.93,7442.345,5152.376,17587.893,10299.724,0.0,84,571.913 +dna-insert,7471.548,5158.202,4390.905,3348.264,11862.452,7420.837,0.0,84,377.99 +extract-elf,6435.419,4827.268,3485.093,2475.985,9920.512,6648.269,0.407,86,361.398 +feal-differential-cryptanalysis,10260.373,10576.331,11437.554,12502.187,21697.928,22408.426,0.096,83,854.631 
+feal-linear-cryptanalysis,15331.314,8204.789,16266.895,10339.788,31598.209,16822.711,0.105,86,1442.42 +filter-js-from-html,4357.651,3967.394,4457.395,4417.707,8815.047,7997.704,0.0,86,394.898 +financial-document-processor,10510.0,6164.39,6036.714,4186.933,16546.714,9892.573,0.012,84,583.616 +fix-code-vulnerability,11657.607,6470.682,6482.5,3612.443,18140.107,8838.158,0.131,84,801.467 +fix-git,4868.837,3264.13,2715.593,1778.886,7584.43,4674.079,0.698,86,351.226 +fix-ocaml-gc,32869.446,18986.214,18819.928,12242.479,51689.373,27460.686,0.06,83,3008.228 +form-filling,8378.699,5285.433,8332.819,8022.162,16711.518,12859.704,0.59,83,450.998 +git-leak-recovery,2912.291,1877.633,2516.372,1833.869,5428.663,3572.333,0.616,86,319.109 +gpt2-codegolf,6516.349,6362.41,6530.747,5123.224,13047.096,11157.328,0.0,83,584.129 +hf-model-inference,5412.69,2755.896,2977.476,2369.971,8390.167,4686.722,0.512,84,425.103 +install-klee-minimal,10249.857,5807.159,2715.893,1871.849,12965.75,6316.906,0.0,84,892.339 +install-windows-3.11,8789.79,5637.779,6036.963,9131.686,14826.753,12993.759,0.0,81,841.276 +large-scale-text-editing,5113.5,3527.271,4831.174,3379.049,9944.674,6259.843,0.198,86,715.538 +largest-eigenval,8151.205,4397.735,6530.735,3549.328,14681.94,7655.999,0.06,83,792.718 +log-summary-date-ranges,6393.209,3348.494,3028.14,2578.859,9421.349,5368.095,0.314,86,224.015 +make-doom-for-mips,15244.186,7313.597,5326.012,2722.344,20570.198,8882.767,0.0,86,856.873 +make-mips-interpreter,22068.325,12281.701,23991.133,14490.41,46059.458,21897.404,0.0,83,1704.065 +merge-diff-arc-agi-task,10868.849,6008.19,5693.605,4173.081,16562.453,9710.534,0.291,86,620.743 +model-extraction-relu-logits,4612.738,4173.486,4036.869,3696.77,8649.607,7704.033,0.071,84,478.149 +mteb-leaderboard,10613.301,12394.097,7353.458,11099.627,17966.759,22119.563,0.0,83,886.108 +mteb-retrieve,3352.155,3814.754,2231.75,2854.139,5583.905,6497.238,0.0,84,298.465 
+nginx-request-logging,4826.69,1562.973,3091.655,2393.633,7918.345,3511.287,0.5,84,392.873 +openssl-selfsigned-cert,3084.0,1684.833,2519.476,2024.524,5603.476,3668.043,0.524,84,226.844 +password-recovery,4818.977,2679.0,4695.105,2391.265,9514.081,4447.722,0.116,86,822.104 +path-tracing,11415.12,12410.635,10044.831,10559.905,21459.952,21972.36,0.012,83,1045.419 +path-tracing-reverse,16743.619,13727.698,12986.548,9996.51,29730.167,22806.208,0.012,84,1219.862 +polyglot-c-py,5691.238,7274.526,5464.298,6469.71,11155.536,13073.5,0.048,84,513.514 +polyglot-rust-c,5648.096,5149.473,6234.639,5627.488,11882.735,10654.25,0.0,83,704.382 +port-compressor,41219.465,25136.328,34419.233,19900.245,75638.698,41679.973,0.012,86,3196.049 +prove-plus-comm,2471.256,1513.801,2531.826,2240.575,5003.081,3684.174,0.663,86,341.061 +pypi-server,5866.798,3929.936,3007.857,2203.771,8874.655,5746.63,0.476,84,427.736 +pytorch-model-cli,6674.892,5294.467,4149.072,3079.792,10823.964,7737.753,0.12,83,481.068 +pytorch-model-recovery,10663.965,5482.2,8684.953,4765.994,19348.918,9205.485,0.471,85,693.46 +qemu-alpine-ssh,2518.434,1274.948,3464.494,2327.35,5982.928,3334.032,0.157,83,578.046 +qemu-startup,2560.854,2730.714,2512.683,2022.604,5073.537,4230.129,0.28,82,480.642 +regex-log,2460.354,2061.84,2244.988,2149.682,4705.341,4146.232,0.439,82,267.606 +reshard-c4-data,6847.185,3896.795,5792.012,3752.124,12639.198,7256.112,0.025,81,617.392 +reverse-engineering,15992.238,11227.678,12614.25,11435.36,28606.488,21237.874,0.095,84,1620.234 +run-pdp11-code,6627.61,4322.427,4833.488,3357.998,11461.098,7093.743,0.0,82,742.973 +sanitize-git-repo,9156.059,5367.246,3461.941,2142.098,12618.0,6849.576,0.024,85,546.928 +schemelike-metacircular-eval,18621.134,12918.601,21160.402,16858.009,39781.537,28240.241,0.024,82,1705.127 +sparql-university,5456.622,3124.541,2792.073,2076.83,8248.695,4942.519,0.122,82,371.516 +sqlite-db-truncate,5023.988,2688.471,4025.2,2406.118,9049.188,4865.883,0.012,85,451.009 
+sqlite-with-gcov,7443.795,4000.523,2371.723,2583.694,9815.518,5400.562,0.47,83,404.705 +torch-tensor-parallelism,3786.012,3712.744,2744.434,1983.906,6530.446,5315.308,0.0,83,285.298 +train-fasttext,20995.805,12557.522,10207.585,6400.98,31203.39,15717.079,0.061,82,2893.165 +tune-mjcf,8890.776,4114.678,7897.471,3616.388,16788.247,7029.962,0.141,85,829.488 +video-processing,4218.146,2894.0,3735.902,2787.462,7954.049,5564.539,0.0,82,276.999 +vulnerable-secret,6217.859,4192.066,5751.024,5319.715,11968.882,7612.159,0.294,85,723.133 +wasm-pipeline,8439.181,4484.565,5252.349,2923.095,13691.53,6487.176,0.301,83,583.73 +winning-avg-corewars,17315.073,12442.409,17002.159,13267.554,34317.232,25411.087,0.073,82,2183.03 +write-compressor,7325.47,5563.372,7513.265,6644.994,14838.735,10854.736,0.024,83,838.518 diff --git a/notebooks/output_token_analysis_pipeline/results/trial_token_usage.csv b/notebooks/output_token_analysis_pipeline/results/trial_token_usage.csv new file mode 100644 index 0000000..ec030ad --- /dev/null +++ b/notebooks/output_token_analysis_pipeline/results/trial_token_usage.csv @@ -0,0 +1,6200 @@ +trial_id,model_name,provider,task_name,n_input_tokens,n_output_tokens,total_tokens,execution_time_sec,success,reward,model_name_perf,task_name_perf,execution_time_perf,success_perf,model_success_rate,final_success,final_execution_time +54242fbe-3b51-49f3-ae49-4c54c815aa61,gemini-2.5-pro,gemini,fix-ocaml-gc,36693,10994,47687,3600.464048,False,0.0,gemini-2.5-pro,fix-ocaml-gc,3600.464048,False,0.2,False,3600.464048 +ba1cb721-476c-4678-b6d9-a32c574299f9,OpenAI/gpt-oss-20B,together_ai,git-leak-recovery,492,970,1462,98.778482,False,0.0,OpenAI/gpt-oss-20B,git-leak-recovery,98.778482,False,0.0,False,98.778482 +7bb024c7-011a-4b66-8e79-188a2df3f5cf,deepseek-ai/DeepSeek-V3.1,together_ai,largest-eigenval,2803,1597,4400,909.685033,False,0.0,deepseek-ai/DeepSeek-V3.1,largest-eigenval,909.685033,False,0.2,False,909.685033 
+1a3cec9b-b4a1-45e8-b8b6-6d957408a37a,moonshotai/Kimi-K2-Instruct-0905,together_ai,path-tracing,9056,8736,17792,840.989617,False,0.0,moonshotai/Kimi-K2-Instruct-0905,path-tracing,840.989617,False,0.0,False,840.989617 +412632cc-aac1-47d1-85bd-1afd32e384f6,gpt-5,openai,write-compressor,1894,2690,4584,900.250943,False,0.0,gpt-5,write-compressor,900.250943,False,0.3333333333333333,False,900.250943 +4df4f348-712f-4adb-87c3-ee00917faad0,grok-4-0709,xai,dna-assembly,1157,286,1443,756.442839,False,0.0,grok-4-0709,dna-assembly,756.442839,False,0.0,False,756.442839 +cc28009f-3117-4466-a75f-6fb0cf402b6e,OpenAI/gpt-oss-20B,together_ai,feal-linear-cryptanalysis,3352,13885,17237,1042.670139,False,0.0,OpenAI/gpt-oss-20B,feal-linear-cryptanalysis,1042.670139,False,0.0,False,1042.670139 +52dd0a42-0529-4ff2-b822-33120fb18a63,deepseek-ai/DeepSeek-V3.1,together_ai,constraints-scheduling,5578,4056,9634,462.471271,True,1.0,deepseek-ai/DeepSeek-V3.1,constraints-scheduling,462.471271,True,0.8,True,462.471271 +c6eba79c-375a-4a82-b0d0-2e34e1e30e1f,gpt-5,openai,log-summary-date-ranges,5777,2040,7817,203.376941,False,0.0,gpt-5,log-summary-date-ranges,203.376941,False,0.0,False,203.376941 +79af95f8-2276-4ddc-8c39-6a015faa4b2f,claude-opus-4-1-20250805,anthropic,sqlite-with-gcov,9153,1444,10597,265.550426,True,1.0,claude-opus-4-1-20250805,sqlite-with-gcov,265.550426,True,0.5714285714285714,True,265.550426 +b15502e6-690f-4df9-8953-ab33fa8268ca,grok-code-fast-1,xai,mteb-retrieve,3552,781,4333,210.914319,False,0.0,grok-code-fast-1,mteb-retrieve,210.914319,False,0.0,False,210.914319 +2e7251cd-ee3a-49ba-b2c0-62d85843a04d,gpt-5-mini,openai,polyglot-rust-c,5555,7437,12992,900.035667,False,0.0,gpt-5-mini,polyglot-rust-c,900.035667,False,0.0,False,900.035667 +a303cc65-3e71-4a94-b4d6-59f9ca84cec7,gpt-5-nano,openai,adaptive-rejection-sampler,12280,10786,23066,818.893071,True,1.0,gpt-5-nano,adaptive-rejection-sampler,818.893071,True,0.2,True,818.893071 
+11e10566-b462-43f1-9216-f805f03f0392,OpenAI/gpt-oss-20B,together_ai,db-wal-recovery,1112,832,1944,148.530202,False,0.0,OpenAI/gpt-oss-20B,db-wal-recovery,148.530202,False,0.0,False,148.530202 +6d78f7f4-c47b-4ef8-bd35-af7adb9617fe,gpt-5,openai,fix-ocaml-gc,33403,30131,63534,3604.829114,False,0.0,gpt-5,fix-ocaml-gc,3604.829114,False,0.0,False,3604.829114 +f518223a-567a-41ab-9390-086a69abdc56,claude-opus-4-1-20250805,anthropic,crack-7z-hash,9388,4956,14344,581.221997,True,1.0,claude-opus-4-1-20250805,crack-7z-hash,581.221997,True,0.8888888888888888,True,581.221997 +cfb5cedd-b5b0-4924-9646-1a0336e467e6,gpt-5-mini,openai,pytorch-model-cli,1624,1725,3349,181.859916,False,0.0,gpt-5-mini,pytorch-model-cli,181.859916,False,0.0,False,181.859916 +9d5422f4-bec8-404d-a9cc-0bf3c605f097,claude-opus-4-1-20250805,anthropic,torch-tensor-parallelism,11827,5215,17042,488.326042,False,0.0,claude-opus-4-1-20250805,torch-tensor-parallelism,488.326042,False,0.0,False,488.326042 +88992378-e256-42d9-9358-2d0596158f62,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,constraints-scheduling,5284,4303,9587,391.482547,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,constraints-scheduling,391.482547,False,0.0,False,391.482547 +e2113bfb-9d33-4d24-a0c8-26f95f4e9b77,zai-org/GLM-4.5-Air-FP8,together_ai,db-wal-recovery,3364,5431,8795,910.990073,False,0.0,zai-org/GLM-4.5-Air-FP8,db-wal-recovery,910.990073,False,0.0,False,910.990073 +f24bd6b7-733a-493d-976c-c9cf80698bf4,moonshotai/Kimi-K2-Instruct-0905,together_ai,fix-git,6606,4032,10638,347.422022,True,1.0,moonshotai/Kimi-K2-Instruct-0905,fix-git,347.422022,True,1.0,True,347.422022 +b85060d9-03a4-4ffc-9d45-20e52f5e6f1b,moonshotai/Kimi-K2-Instruct-0905,together_ai,db-wal-recovery,3809,5735,9544,303.838788,False,0.0,moonshotai/Kimi-K2-Instruct-0905,db-wal-recovery,303.838788,False,0.0,False,303.838788 
+e1f3454c-6284-4983-bfe5-99d1d71346de,claude-opus-4-1-20250805,anthropic,pytorch-model-recovery,12483,3585,16068,511.260645,True,1.0,claude-opus-4-1-20250805,pytorch-model-recovery,511.260645,True,1.0,True,511.260645 +dde7b849-23fd-4465-910e-b76d98eb7d13,deepseek-ai/DeepSeek-V3.1,together_ai,regex-log,2878,2859,5737,144.65089,False,0.0,deepseek-ai/DeepSeek-V3.1,regex-log,144.65089,False,0.2,False,144.65089 +d1e0f468-3b22-4fbf-8c21-d314570033a4,gpt-5-mini,openai,path-tracing-reverse,14672,9768,24440,1150.946894,False,0.0,gpt-5-mini,path-tracing-reverse,1150.946894,False,0.0,False,1150.946894 +d1c575cd-dc0e-4807-9d7c-0d5ffc7dc04a,claude-sonnet-4-20250514,anthropic,sqlite-db-truncate,4764,3222,7986,203.612365,False,0.0,claude-sonnet-4-20250514,sqlite-db-truncate,203.612365,False,0.0,False,203.612365 +56dc328c-31f0-410c-ac75-12da0e370794,OpenAI/gpt-oss-20B,together_ai,git-leak-recovery,483,2054,2537,254.141303,False,0.0,OpenAI/gpt-oss-20B,git-leak-recovery,254.141303,False,0.0,False,254.141303 +00b1bab2-2ddb-409b-881d-96e44d4a6b59,grok-4-0709,xai,adaptive-rejection-sampler,5052,2976,8028,931.346731,False,0.0,grok-4-0709,adaptive-rejection-sampler,931.346731,False,0.0,False,931.346731 +3c9a3346-5d8d-46dc-a9a5-c38e1c76844f,gemini-2.5-pro,gemini,count-dataset-tokens,19112,4537,23649,905.098183,False,0.0,gemini-2.5-pro,count-dataset-tokens,905.098183,False,0.0,False,905.098183 +ef316108-fd79-4334-97c5-64cd1a5a4141,deepseek-ai/DeepSeek-V3.1,together_ai,winning-avg-corewars,13818,9820,23638,851.993879,False,0.0,deepseek-ai/DeepSeek-V3.1,winning-avg-corewars,851.993879,False,0.0,False,851.993879 +27d6791b-6b93-481f-a9e5-3da67c2c0004,grok-4-0709,xai,port-compressor,20293,30944,51237,3602.36234,False,0.0,grok-4-0709,port-compressor,3602.36234,False,0.0,False,3602.36234 +1a0eeb4e-7643-4cfe-8e00-546c0bede239,deepseek-ai/DeepSeek-V3.1,together_ai,make-doom-for-mips,5884,733,6617,972.667,False,0.0,deepseek-ai/DeepSeek-V3.1,make-doom-for-mips,972.667,False,0.0,False,972.667 
+d82801ba-982d-453a-93f1-1638700e8aa1,gemini-2.5-flash,gemini,feal-linear-cryptanalysis,22440,58364,80804,1811.558613,False,0.0,gemini-2.5-flash,feal-linear-cryptanalysis,1811.558613,False,0.0,False,1811.558613 +5f19aed8-745f-4ecc-a3c8-ccd641e44220,claude-opus-4-1-20250805,anthropic,prove-plus-comm,2268,1556,3824,300.181889,True,1.0,claude-opus-4-1-20250805,prove-plus-comm,300.181889,True,1.0,True,300.181889 +c60e38e2-9509-4fb1-85eb-7a681c57cf4c,openai/gpt-oss-120b,together_ai,filter-js-from-html,1492,1408,2900,423.723401,False,0.0,openai/gpt-oss-120b,filter-js-from-html,423.723401,False,0.0,False,423.723401 +493ad8a8-e41a-4ce8-963a-9c55de766bb9,gpt-5-nano,openai,pytorch-model-recovery,7393,8339,15732,872.056794,False,0.0,gpt-5-nano,pytorch-model-recovery,872.056794,False,0.0,False,872.056794 +a1563cd0-f27b-4475-acd3-bf58905e134c,gemini-2.5-pro,gemini,pypi-server,6158,2851,9009,514.246346,True,1.0,gemini-2.5-pro,pypi-server,514.246346,True,0.8,True,514.246346 +af7fd4f3-e0ce-41f6-a564-8d9fc25b5adf,grok-code-fast-1,xai,reverse-engineering,8065,3640,11705,1829.960162,False,0.0,grok-code-fast-1,reverse-engineering,1829.960162,False,0.0,False,1829.960162 +0e937de3-87c8-4ecc-a861-41a9c8ebccef,gemini-2.5-pro,gemini,cancel-async-tasks,1459,897,2356,91.541084,False,0.0,gemini-2.5-pro,cancel-async-tasks,91.541084,False,0.0,False,91.541084 +308ba5ce-bf4f-44ed-ae89-4e40c60681f6,gemini-2.5-flash,gemini,reverse-engineering,10464,21489,31953,1802.238321,False,0.0,gemini-2.5-flash,reverse-engineering,1802.238321,False,0.0,False,1802.238321 +d9d92238-1c00-4e5f-9338-75bf9c7b971d,gpt-5-nano,openai,large-scale-text-editing,5113,8911,14024,1200.415566,False,0.0,gpt-5-nano,large-scale-text-editing,1200.415566,False,0.0,False,1200.415566 +c16c931c-8084-469c-80e6-14104a705635,zai-org/GLM-4.5-Air-FP8,together_ai,polyglot-rust-c,13473,13584,27057,900.023997,False,0.0,zai-org/GLM-4.5-Air-FP8,polyglot-rust-c,900.023997,False,0.0,False,900.023997 
+0e2711e5-345c-4aaa-8afe-0d6d7c44d441,gpt-5-mini,openai,mteb-retrieve,2945,2150,5095,290.868252,False,0.0,gpt-5-mini,mteb-retrieve,290.868252,False,0.0,False,290.868252 +b8a17eea-4b3f-43e5-8c6c-15f0677e92c9,grok-4-0709,xai,password-recovery,7096,2883,9979,903.627722,False,0.0,grok-4-0709,password-recovery,903.627722,False,0.0,False,903.627722 +6756bf43-ec57-4ec9-806e-5c4663836e90,claude-opus-4-1-20250805,anthropic,extract-elf,5070,2283,7353,232.32937,True,1.0,claude-opus-4-1-20250805,extract-elf,232.32937,True,0.8888888888888888,True,232.32937 +5cedf39e-3a28-4040-bdaf-909a91d9efd3,deepseek-ai/DeepSeek-V3.1,together_ai,sqlite-with-gcov,9446,1831,11277,415.302093,True,1.0,deepseek-ai/DeepSeek-V3.1,sqlite-with-gcov,415.302093,True,0.8,True,415.302093 +4ab88066-e885-44a2-9c24-94c635a3f7f6,gpt-5,openai,torch-tensor-parallelism,2947,2693,5640,204.641127,False,0.0,gpt-5,torch-tensor-parallelism,204.641127,False,0.0,False,204.641127 +6d21b2e1-3b18-4728-a7df-9fc83f20760c,gemini-2.5-flash,gemini,nginx-request-logging,3776,1311,5087,226.678299,False,0.0,gemini-2.5-flash,nginx-request-logging,226.678299,False,0.0,False,226.678299 +0a5ea382-2579-4a5b-8712-3adaaac0f7a5,openai/gpt-oss-120b,together_ai,model-extraction-relu-logits,1531,3036,4567,85.651858,False,0.0,openai/gpt-oss-120b,model-extraction-relu-logits,85.651858,False,0.0,False,85.651858 +7500d5de-a64f-4104-a6e6-002c45ce48b3,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,path-tracing,13337,11761,25098,1805.165513,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,path-tracing,1805.165513,False,0.0,False,1805.165513 +d5200423-de2e-409f-b3ad-204bc2d297fd,gpt-5,openai,break-filter-js-from-html,2843,2313,5156,161.146064,False,0.0,gpt-5,break-filter-js-from-html,161.146064,False,0.4285714285714285,False,161.146064 +9c26cd4c-dec9-40b5-8ef6-93a5b6d08c0b,gpt-5-nano,openai,path-tracing,16670,20924,37594,1800.037215,True,1.0,gpt-5-nano,path-tracing,1800.037215,True,0.2,True,1800.037215 
+1d595ab4-6d13-4782-a2aa-d16f21026d9d,grok-4-0709,xai,vulnerable-secret,6076,2550,8626,767.651047,True,1.0,grok-4-0709,vulnerable-secret,767.651047,True,0.6,True,767.651047 +c4add67a-b81a-4dfa-a5e3-df08871b753d,gpt-5,openai,dna-assembly,13954,13219,27173,666.00144,False,0.0,gpt-5,dna-assembly,666.00144,False,0.0,False,666.00144 +0537cba9-14d9-426b-accc-b07c2542ec08,gpt-5-nano,openai,prove-plus-comm,2595,2365,4960,291.844602,True,1.0,gpt-5-nano,prove-plus-comm,291.844602,True,0.4,True,291.844602 +97fbbc39-736d-4f5c-9f68-baf75a97efd1,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sqlite-with-gcov,12796,2772,15568,528.388895,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sqlite-with-gcov,528.388895,True,0.6,True,528.388895 +7c46e0ff-7e20-4818-99a6-696ba088760a,claude-sonnet-4-20250514,anthropic,sanitize-git-repo,26944,7681,34625,769.707821,False,0.0,claude-sonnet-4-20250514,sanitize-git-repo,769.707821,False,0.0,False,769.707821 +5faa7bb1-2260-4e2f-907c-9f5311f64452,grok-code-fast-1,xai,log-summary-date-ranges,6979,2586,9565,166.377165,False,0.0,grok-code-fast-1,log-summary-date-ranges,166.377165,False,0.0,False,166.377165 +0d9ebbae-d083-4cab-b55e-e8c42ab9fddb,claude-sonnet-4-20250514,anthropic,feal-linear-cryptanalysis,27460,23562,51022,1800.001266,False,0.0,claude-sonnet-4-20250514,feal-linear-cryptanalysis,1800.001266,False,0.0,False,1800.001266 +efc8bdeb-3d7c-4ef9-97e8-70d3279745c8,moonshotai/Kimi-K2-Instruct-0905,together_ai,configure-git-webserver,7666,4650,12316,789.772052,False,0.0,moonshotai/Kimi-K2-Instruct-0905,configure-git-webserver,789.772052,False,0.6,False,789.772052 +2ef87912-4090-4887-afdb-34d376586e6c,gpt-5,openai,pytorch-model-cli,2538,2444,4982,268.154951,False,0.0,gpt-5,pytorch-model-cli,268.154951,False,0.0,False,268.154951 
+9989cbee-0411-4a8c-9f62-b919f07eeb0c,moonshotai/Kimi-K2-Instruct-0905,together_ai,torch-tensor-parallelism,3632,2632,6264,633.499363,False,0.0,moonshotai/Kimi-K2-Instruct-0905,torch-tensor-parallelism,633.499363,False,0.0,False,633.499363 +b889594d-fbf7-421d-a79d-5e87e8e7a6ee,openai/gpt-oss-120b,together_ai,db-wal-recovery,3840,4874,8714,348.080385,False,0.0,openai/gpt-oss-120b,db-wal-recovery,348.080385,False,0.0,False,348.080385 +a02f0adf-75cb-4835-9ebe-6ca02233115a,grok-code-fast-1,xai,mteb-retrieve,3593,858,4451,217.240875,False,0.0,grok-code-fast-1,mteb-retrieve,217.240875,False,0.0,False,217.240875 +b5a614e8-c774-4f8b-b82e-053e135e475a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sqlite-with-gcov,5586,1781,7367,123.837943,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sqlite-with-gcov,123.837943,True,0.4,True,123.837943 +f42c6a34-07c6-44bb-991f-1d45c2020542,deepseek-ai/DeepSeek-V3.1,together_ai,cobol-modernization,9022,6680,15702,512.576236,True,1.0,deepseek-ai/DeepSeek-V3.1,cobol-modernization,512.576236,True,0.6,True,512.576236 +52d812e1-f65d-4f7d-9439-fccec6a7872b,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,feal-linear-cryptanalysis,3245,2994,6239,659.535679,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,feal-linear-cryptanalysis,659.535679,False,0.0,False,659.535679 +7f2ea6f9-620a-4ce9-b4dd-85defc41c11f,openai/gpt-oss-120b,together_ai,prove-plus-comm,1635,869,2504,141.927923,True,1.0,openai/gpt-oss-120b,prove-plus-comm,141.927923,True,1.0,True,141.927923 +7f6e296e-e065-41d3-bf73-e5dc2eaca4a8,grok-4-0709,xai,feal-differential-cryptanalysis,2349,1225,3574,731.298854,True,1.0,grok-4-0709,feal-differential-cryptanalysis,731.298854,True,0.8,True,731.298854 +02985f59-ddc1-48cd-8403-66aff8fc2126,deepseek-ai/DeepSeek-V3.1,together_ai,write-compressor,1698,1063,2761,939.336987,False,0.0,deepseek-ai/DeepSeek-V3.1,write-compressor,939.336987,False,0.0,False,939.336987 
+af4bc0ae-2786-4af7-8c9c-6d8b1cd1c03f,gpt-5,openai,qemu-alpine-ssh,3207,4017,7224,960.243697,False,0.0,gpt-5,qemu-alpine-ssh,960.243697,False,0.1666666666666666,False,960.243697 +d7be9106-ba94-4e23-963b-6117831f4c34,grok-4-0709,xai,schemelike-metacircular-eval,13900,14325,28225,1481.990202,False,0.0,grok-4-0709,schemelike-metacircular-eval,1481.990202,False,0.0,False,1481.990202 +268e8eec-16aa-4301-be7e-3a7ef529fc80,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,fix-git,3602,1392,4994,551.904755,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,fix-git,551.904755,False,0.0,False,551.904755 +6ef1dad1-d823-42e5-a1e3-117d483db278,gpt-5-nano,openai,qemu-alpine-ssh,3059,4861,7920,921.555876,False,0.0,gpt-5-nano,qemu-alpine-ssh,921.555876,False,0.0,False,921.555876 +fa24fa9b-a773-4b3b-8488-c22d34301de8,gemini-2.5-flash,gemini,configure-git-webserver,6684,1691,8375,144.130926,False,0.0,gemini-2.5-flash,configure-git-webserver,144.130926,False,0.0,False,144.130926 +d3ff7723-523c-4868-a5e4-9b0e23e2b571,OpenAI/gpt-oss-20B,together_ai,qemu-alpine-ssh,2732,5691,8423,238.233703,False,0.0,OpenAI/gpt-oss-20B,qemu-alpine-ssh,238.233703,False,0.0,False,238.233703 +7719f772-f6ea-4bc5-b035-970d7c57a200,moonshotai/Kimi-K2-Instruct-0905,together_ai,sanitize-git-repo,12011,3963,15974,602.871666,False,0.0,moonshotai/Kimi-K2-Instruct-0905,sanitize-git-repo,602.871666,False,0.0,False,602.871666 +b9edcdc2-de44-4cfd-9c9f-f591c72ab802,grok-code-fast-1,xai,polyglot-c-py,1494,1280,2774,428.017157,False,0.0,grok-code-fast-1,polyglot-c-py,428.017157,False,0.0,False,428.017157 +2e924e64-1325-40a9-9c8d-903d02435aa3,gemini-2.5-flash,gemini,break-filter-js-from-html,1800,1276,3076,132.207215,False,0.0,gemini-2.5-flash,break-filter-js-from-html,132.207215,False,0.0,False,132.207215 
+804384d0-f540-4ce8-86db-7b9e66721dbc,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,openssl-selfsigned-cert,2341,1054,3395,122.044992,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,openssl-selfsigned-cert,122.044992,False,0.0,False,122.044992 +28314033-4e01-41a9-8e62-6e6cdc102943,claude-sonnet-4-20250514,anthropic,large-scale-text-editing,3160,2771,5931,524.042604,False,0.0,claude-sonnet-4-20250514,large-scale-text-editing,524.042604,False,0.6,False,524.042604 +54bd1fa0-9614-4a84-b82f-ef1c01f98a93,claude-opus-4-1-20250805,anthropic,run-pdp11-code,2267,1256,3523,1013.398577,False,0.0,claude-opus-4-1-20250805,run-pdp11-code,1013.398577,False,0.0,False,1013.398577 +f3a9382a-a286-4120-8504-083298757995,gemini-2.5-flash,gemini,winning-avg-corewars,19223,28384,47607,3639.669892,False,0.0,gemini-2.5-flash,winning-avg-corewars,3639.669892,False,0.0,False,3639.669892 +3458662c-4385-409d-9a49-9954dba94727,deepseek-ai/DeepSeek-V3.1,together_ai,winning-avg-corewars,9630,8946,18576,1545.868203,False,0.0,deepseek-ai/DeepSeek-V3.1,winning-avg-corewars,1545.868203,False,0.0,False,1545.868203 +0808b141-e692-4b10-9099-1a0756b10bc7,gemini-2.5-pro,gemini,hf-model-inference,4045,1522,5567,385.675959,True,1.0,gemini-2.5-pro,hf-model-inference,385.675959,True,0.8,True,385.675959 +dd474613-0f9d-4aa0-984a-667e63e3b148,zai-org/GLM-4.5-Air-FP8,together_ai,winning-avg-corewars,15953,16153,32106,1501.310929,False,0.0,zai-org/GLM-4.5-Air-FP8,winning-avg-corewars,1501.310929,False,0.0,False,1501.310929 +020e26d5-5dd5-4e82-b247-f6d67bc995e6,zai-org/GLM-4.5-Air-FP8,together_ai,sqlite-db-truncate,3144,3754,6898,99.004713,False,0.0,zai-org/GLM-4.5-Air-FP8,sqlite-db-truncate,99.004713,False,0.0,False,99.004713 +c2e8bfaa-e950-4939-ad1c-2c8c99e94b42,grok-4-0709,xai,count-dataset-tokens,13333,3965,17298,900.553353,False,0.0,grok-4-0709,count-dataset-tokens,900.553353,False,0.0,False,900.553353 
+681bc96d-2a38-4a72-bd84-f95c3729ebfb,zai-org/GLM-4.5-Air-FP8,together_ai,polyglot-rust-c,6350,8251,14601,906.801652,False,0.0,zai-org/GLM-4.5-Air-FP8,polyglot-rust-c,906.801652,False,0.0,False,906.801652 +d7fe02c2-1891-46db-97cd-a17e9c05026f,zai-org/GLM-4.5-Air-FP8,together_ai,nginx-request-logging,7611,5711,13322,582.483279,True,1.0,zai-org/GLM-4.5-Air-FP8,nginx-request-logging,582.483279,True,1.0,True,582.483279 +d70d915e-a962-4b22-a008-67afe232d46d,claude-opus-4-1-20250805,anthropic,fix-git,2712,1749,4461,235.71115,True,1.0,claude-opus-4-1-20250805,fix-git,235.71115,True,1.0,True,235.71115 +dd6e062f-d678-4c50-8914-f8593e4bd2ad,gemini-2.5-pro,gemini,log-summary-date-ranges,7224,1642,8866,293.474978,False,0.0,gemini-2.5-pro,log-summary-date-ranges,293.474978,False,0.0,False,293.474978 +6ab64a24-d963-4053-8f17-ffc44ae48c97,claude-opus-4-1-20250805,anthropic,fix-ocaml-gc,46048,22988,69036,2913.531335,True,1.0,claude-opus-4-1-20250805,fix-ocaml-gc,2913.531335,True,0.5,True,2913.531335 +2659e60e-61c7-4b01-802f-d2b94ee8623a,openai/gpt-oss-120b,together_ai,pytorch-model-cli,1221,978,2199,126.826242,False,0.0,openai/gpt-oss-120b,pytorch-model-cli,126.826242,False,0.0,False,126.826242 +7862f772-f0c0-4cd6-bc2a-8c572d18a41a,gemini-2.5-pro,gemini,vulnerable-secret,7030,3243,10273,649.110238,True,1.0,gemini-2.5-pro,vulnerable-secret,649.110238,True,0.8,True,649.110238 +437f079f-caf5-48c8-95b1-89039ff6c5c9,OpenAI/gpt-oss-20B,together_ai,build-pmars,387,1254,1641,235.343206,False,0.0,OpenAI/gpt-oss-20B,build-pmars,235.343206,False,0.0,False,235.343206 +2bc1a810-2c1f-40a9-9364-d2ee01dd1109,claude-sonnet-4-20250514,anthropic,model-extraction-relu-logits,5181,4856,10037,524.281566,False,0.0,claude-sonnet-4-20250514,model-extraction-relu-logits,524.281566,False,0.0,False,524.281566 +1c80a047-a419-419c-91be-b157b0827062,gemini-2.5-pro,gemini,regex-log,1414,597,2011,141.182113,True,1.0,gemini-2.5-pro,regex-log,141.182113,True,0.8,True,141.182113 
+3634b51d-f88c-4f37-b842-8249692cb8c7,gemini-2.5-flash,gemini,large-scale-text-editing,2310,1303,3613,243.565163,False,0.0,gemini-2.5-flash,large-scale-text-editing,243.565163,False,0.0,False,243.565163 +4d8626aa-b16a-4b73-9396-2a78c86263c7,deepseek-ai/DeepSeek-V3.1,together_ai,mteb-retrieve,2329,1275,3604,85.97783,False,0.0,deepseek-ai/DeepSeek-V3.1,mteb-retrieve,85.97783,False,0.0,False,85.97783 +419dd4c2-415e-45ee-a15e-dc05469f9c72,deepseek-ai/DeepSeek-V3.1,together_ai,pytorch-model-recovery,16939,17813,34752,914.39971,False,0.0,deepseek-ai/DeepSeek-V3.1,pytorch-model-recovery,914.39971,False,0.6,False,914.39971 +97d75b2a-29f8-4ef3-8335-d46a62c03d36,gpt-5-nano,openai,fix-git,4779,3415,8194,900.000949,False,0.0,gpt-5-nano,fix-git,900.000949,False,0.0,False,900.000949 +2ecbb0d2-527c-416d-80a3-a40bb6710cf5,gpt-5,openai,fix-code-vulnerability,5132,7192,12324,902.279823,False,0.0,gpt-5,fix-code-vulnerability,902.279823,False,0.0,False,902.279823 +108bcdc9-f2bb-4c9b-ad1a-3d92c097462d,deepseek-ai/DeepSeek-V3.1,together_ai,count-dataset-tokens,17154,4401,21555,794.54257,False,0.0,deepseek-ai/DeepSeek-V3.1,count-dataset-tokens,794.54257,False,0.0,False,794.54257 +3bf026a8-8878-4aac-8a89-18ece7b0e54f,deepseek-ai/DeepSeek-V3.1,together_ai,bn-fit-modify,15461,7328,22789,1015.560609,False,0.0,deepseek-ai/DeepSeek-V3.1,bn-fit-modify,1015.560609,False,0.0,False,1015.560609 +d2f56d4a-6033-4142-9262-4f6b7063741e,moonshotai/Kimi-K2-Instruct-0905,together_ai,feal-differential-cryptanalysis,26883,30179,57062,1808.40788,False,0.0,moonshotai/Kimi-K2-Instruct-0905,feal-differential-cryptanalysis,1808.40788,False,0.0,False,1808.40788 +52a24d4b-ba84-4f45-b2b7-b5b4c758e82a,zai-org/GLM-4.5-Air-FP8,together_ai,sparql-university,5634,2845,8479,220.562767,False,0.0,zai-org/GLM-4.5-Air-FP8,sparql-university,220.562767,False,0.0,False,220.562767 
+775a18bc-c52a-4805-88b1-c0c10191a837,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,polyglot-rust-c,4296,3098,7394,340.353375,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,polyglot-rust-c,340.353375,False,0.0,False,340.353375 +39990a66-0bef-416f-ba42-7e832383a32a,gemini-2.5-pro,gemini,git-leak-recovery,2132,1550,3682,161.396977,True,1.0,gemini-2.5-pro,git-leak-recovery,161.396977,True,1.0,True,161.396977 +aec6612e-395b-4562-b6b0-654398923805,grok-code-fast-1,xai,adaptive-rejection-sampler,7485,6473,13958,488.475857,False,0.0,grok-code-fast-1,adaptive-rejection-sampler,488.475857,False,0.0,False,488.475857 +9ea1759f-a0f0-4248-9bcf-110e46e1d0e4,gpt-5-nano,openai,tune-mjcf,6763,8397,15160,995.823158,False,0.0,gpt-5-nano,tune-mjcf,995.823158,False,0.0,False,995.823158 +ced38a76-1968-480c-9637-281d55b77a49,gpt-5-nano,openai,schemelike-metacircular-eval,17532,22872,40404,2464.685159,True,1.0,gpt-5-nano,schemelike-metacircular-eval,2464.685159,True,0.2,True,2464.685159 +3171e92f-94fd-48e4-aafa-a31948aac168,claude-opus-4-1-20250805,anthropic,code-from-image,22779,16068,38847,747.059007,True,1.0,claude-opus-4-1-20250805,code-from-image,747.059007,True,0.125,True,747.059007 +d8520981-e0c1-43c5-9d82-cd2d002215b5,grok-code-fast-1,xai,nginx-request-logging,3663,1288,4951,78.433008,False,0.0,grok-code-fast-1,nginx-request-logging,78.433008,False,0.0,False,78.433008 +79944840-cfee-4e24-adb3-640e801c0be5,gpt-5-mini,openai,form-filling,5043,3717,8760,183.801511,True,1.0,gpt-5-mini,form-filling,183.801511,True,1.0,True,183.801511 +1f79a6b8-e72d-48d1-be74-f0fae5d6c03e,gpt-5-mini,openai,train-fasttext,19155,15457,34612,3648.149359,False,0.0,gpt-5-mini,train-fasttext,3648.149359,False,0.0,False,3648.149359 +0af2ceb3-da0d-4bf3-b889-dc7456542ec5,claude-sonnet-4-20250514,anthropic,pypi-server,6112,4406,10518,408.477541,True,1.0,claude-sonnet-4-20250514,pypi-server,408.477541,True,0.8,True,408.477541 
+81dd5a03-18a1-47be-b176-b2ecb592c3a5,zai-org/GLM-4.5-Air-FP8,together_ai,build-initramfs-qemu,2371,2530,4901,85.91385,False,0.0,zai-org/GLM-4.5-Air-FP8,build-initramfs-qemu,85.91385,False,0.0,False,85.91385 +c2f1bbe8-98b5-42ce-acdb-7eaec0fe27f3,gemini-2.5-pro,gemini,openssl-selfsigned-cert,3029,1706,4735,148.691059,False,0.0,gemini-2.5-pro,openssl-selfsigned-cert,148.691059,False,0.6,False,148.691059 +106ed985-8563-417a-8917-f243f52bcc20,gpt-5-mini,openai,polyglot-c-py,3289,2652,5941,317.484834,False,0.0,gpt-5-mini,polyglot-c-py,317.484834,False,0.0,False,317.484834 +1059aecd-1da1-4806-939d-0f77a64f4e01,gpt-5,openai,qemu-alpine-ssh,1705,967,2672,290.37141,True,1.0,gpt-5,qemu-alpine-ssh,290.37141,True,0.1666666666666666,True,290.37141 +48faaa54-371a-4539-aa39-cbf013c15275,grok-code-fast-1,xai,regex-log,1300,697,1997,78.786385,False,0.0,grok-code-fast-1,regex-log,78.786385,False,0.0,False,78.786385 +cd84fb75-892a-4d65-9084-02c337b9a4e2,grok-code-fast-1,xai,sparql-university,5013,1702,6715,84.458351,True,1.0,grok-code-fast-1,sparql-university,84.458351,True,0.2,True,84.458351 +1bf00f9f-1834-47f5-9cd5-43823df894f9,deepseek-ai/DeepSeek-V3.1,together_ai,tune-mjcf,9379,7268,16647,939.710948,False,0.0,deepseek-ai/DeepSeek-V3.1,tune-mjcf,939.710948,False,0.0,False,939.710948 +dc9de74b-2e17-482f-b32c-8a86c54a3501,zai-org/GLM-4.5-Air-FP8,together_ai,pytorch-model-recovery,15625,10683,26308,817.002718,True,1.0,zai-org/GLM-4.5-Air-FP8,pytorch-model-recovery,817.002718,True,0.4,True,817.002718 +e56b5895-7bc5-4aba-9b33-78c32c3514b6,deepseek-ai/DeepSeek-V3.1,together_ai,distribution-search,12599,11999,24598,1247.073547,False,0.0,deepseek-ai/DeepSeek-V3.1,distribution-search,1247.073547,False,0.0,False,1247.073547 +c0f0649a-6e76-490f-b918-14e908dac67f,deepseek-ai/DeepSeek-V3.1,together_ai,dna-assembly,7884,3118,11002,249.394607,False,0.0,deepseek-ai/DeepSeek-V3.1,dna-assembly,249.394607,False,0.0,False,249.394607 
+01b0549b-ac54-41f2-bc1d-9c4b9dbb6d60,gemini-2.5-pro,gemini,cancel-async-tasks,1576,1380,2956,170.05352,False,0.0,gemini-2.5-pro,cancel-async-tasks,170.05352,False,0.0,False,170.05352 +aacdbe1d-b4ca-49b1-93e3-ab27e5dba1c1,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,chess-best-move,16594,7080,23674,820.276921,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,chess-best-move,820.276921,False,0.0,False,820.276921 +2e2bbce6-92ad-40fc-afd3-6c8d99e937bd,gemini-2.5-flash,gemini,cancel-async-tasks,2348,3104,5452,684.612171,False,0.0,gemini-2.5-flash,cancel-async-tasks,684.612171,False,0.2,False,684.612171 +b24625f3-3305-496d-9200-0b7071eaf2c5,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,crack-7z-hash,6486,3916,10402,459.921733,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,crack-7z-hash,459.921733,False,0.0,False,459.921733 +6ab32e2a-c3d4-447b-ac01-11ab0712d5f0,OpenAI/gpt-oss-20B,together_ai,large-scale-text-editing,1245,1240,2485,51.851568,False,0.0,OpenAI/gpt-oss-20B,large-scale-text-editing,51.851568,False,0.0,False,51.851568 +b35b8bcf-1cd9-44f8-9f2c-ae9cc35c67c0,moonshotai/Kimi-K2-Instruct-0905,together_ai,extract-elf,14649,4839,19488,559.724871,True,1.0,moonshotai/Kimi-K2-Instruct-0905,extract-elf,559.724871,True,0.6,True,559.724871 +a548e08d-8e9f-4998-8722-3e2b6f47afdc,zai-org/GLM-4.5-Air-FP8,together_ai,chess-best-move,13672,8668,22340,509.512858,False,0.0,zai-org/GLM-4.5-Air-FP8,chess-best-move,509.512858,False,0.0,False,509.512858 +ed7d62ec-44eb-4d38-a95d-8742047dab90,claude-sonnet-4-20250514,anthropic,large-scale-text-editing,5838,5677,11515,1200.031628,False,0.0,claude-sonnet-4-20250514,large-scale-text-editing,1200.031628,False,0.6,False,1200.031628 +a7ca0d02-2ecb-45c1-b9d9-088ebeed125d,grok-4-0709,xai,polyglot-rust-c,0,0,0,900.176969,False,0.0,grok-4-0709,polyglot-rust-c,900.176969,False,0.0,False,900.176969 
+9c813aee-a81d-4e90-8df8-f61b2dd81087,deepseek-ai/DeepSeek-V3.1,together_ai,extract-elf,6638,1428,8066,245.552533,False,0.0,deepseek-ai/DeepSeek-V3.1,extract-elf,245.552533,False,0.6,False,245.552533 +c788a979-4c22-4679-9638-433a205d9b27,zai-org/GLM-4.5-Air-FP8,together_ai,feal-linear-cryptanalysis,17714,18534,36248,1822.693658,False,0.0,zai-org/GLM-4.5-Air-FP8,feal-linear-cryptanalysis,1822.693658,False,0.0,False,1822.693658 +852515e7-ae0c-45f5-92cc-064f9907e77f,claude-sonnet-4-20250514,anthropic,feal-differential-cryptanalysis,27626,28649,56275,1807.219773,False,0.0,claude-sonnet-4-20250514,feal-differential-cryptanalysis,1807.219773,False,0.0,False,1807.219773 +2273405c-10d4-475c-a5de-f1815d335cd3,gpt-5,openai,configure-git-webserver,5084,1972,7056,145.150595,True,1.0,gpt-5,configure-git-webserver,145.150595,True,1.0,True,145.150595 +7a042abc-c91d-4be6-8d68-339839b1af36,claude-opus-4-1-20250805,anthropic,video-processing,3281,2986,6267,90.555214,False,0.0,claude-opus-4-1-20250805,video-processing,90.555214,False,0.0,False,90.555214 +da36dc85-145e-40a8-aa8c-ca018763c3e4,gpt-5,openai,distribution-search,2893,2128,5021,327.497215,True,1.0,gpt-5,distribution-search,327.497215,True,1.0,True,327.497215 +998fe7e9-864b-4b9a-a5cc-fb570d96ea14,gemini-2.5-flash,gemini,form-filling,14332,11013,25345,912.370358,False,0.0,gemini-2.5-flash,form-filling,912.370358,False,0.0,False,912.370358 +29814007-ef14-4d68-a6ca-6420a13b67c0,gpt-5,openai,pytorch-model-cli,2164,1966,4130,149.855489,False,0.0,gpt-5,pytorch-model-cli,149.855489,False,0.0,False,149.855489 +d6667947-704b-4737-b0d3-9ea5e623a4b3,gemini-2.5-pro,gemini,build-pmars,7860,2432,10292,224.835783,True,1.0,gemini-2.5-pro,build-pmars,224.835783,True,1.0,True,224.835783 +cc7195b5-5151-42d3-ae73-74e475f5a503,grok-4-0709,xai,reverse-engineering,10120,4225,14345,1802.557031,False,0.0,grok-4-0709,reverse-engineering,1802.557031,False,0.2,False,1802.557031 
+190922b4-bc91-4467-aa14-ea3264e1a6b8,zai-org/GLM-4.5-Air-FP8,together_ai,reshard-c4-data,7828,4767,12595,268.393214,False,0.0,zai-org/GLM-4.5-Air-FP8,reshard-c4-data,268.393214,False,0.0,False,268.393214 +4b071e58-8132-4351-ac84-74de9436119f,OpenAI/gpt-oss-20B,together_ai,feal-differential-cryptanalysis,330,1237,1567,65.323061,False,0.0,OpenAI/gpt-oss-20B,feal-differential-cryptanalysis,65.323061,False,0.0,False,65.323061 +34fdaf91-a5c2-4665-b2e2-4ccdc1bdb96b,gpt-5-nano,openai,log-summary-date-ranges,2389,1893,4282,210.414753,False,0.0,gpt-5-nano,log-summary-date-ranges,210.414753,False,0.0,False,210.414753 +a39e4c84-ce1a-4423-98a8-c935982a9dc9,grok-code-fast-1,xai,cobol-modernization,4625,2597,7222,775.841924,False,0.0,grok-code-fast-1,cobol-modernization,775.841924,False,0.6,False,775.841924 +5f47255a-e9ee-4db6-aced-a38e5ed437f6,grok-code-fast-1,xai,pytorch-model-recovery,11220,7866,19086,388.586555,True,1.0,grok-code-fast-1,pytorch-model-recovery,388.586555,True,0.8,True,388.586555 +898e20a2-2f30-4d3b-beb3-f855059c4a42,OpenAI/gpt-oss-20B,together_ai,sqlite-with-gcov,1304,808,2112,164.473224,False,0.0,OpenAI/gpt-oss-20B,sqlite-with-gcov,164.473224,False,0.0,False,164.473224 +44ab5543-e9e8-4f62-9ee1-b33c1d394ca9,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-cython-ext,20640,4384,25024,900.881575,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-cython-ext,900.881575,False,0.0,False,900.881575 +da1e135a-1f9b-43f3-b01a-3c48f74205cd,grok-4-0709,xai,write-compressor,1375,579,1954,904.310914,False,0.0,grok-4-0709,write-compressor,904.310914,False,0.0,False,904.310914 +4657c8d9-2d07-41fb-a682-0077dd737d78,grok-code-fast-1,xai,gpt2-codegolf,1249,785,2034,44.607847,False,0.0,grok-code-fast-1,gpt2-codegolf,44.607847,False,0.0,False,44.607847 +f5ea7123-b733-4901-94b6-d72e3799f09c,gpt-5,openai,write-compressor,8855,5539,14394,707.465168,True,1.0,gpt-5,write-compressor,707.465168,True,0.3333333333333333,True,707.465168 
+f9abff12-4f9a-4bd6-8f18-523bff9e1f91,claude-opus-4-1-20250805,anthropic,pytorch-model-recovery,12164,10426,22590,900.001341,True,1.0,claude-opus-4-1-20250805,pytorch-model-recovery,900.001341,True,1.0,True,900.001341 +551d0d50-197f-4fe0-845c-7b48626119b1,moonshotai/Kimi-K2-Instruct-0905,together_ai,tune-mjcf,6995,5906,12901,589.374911,True,1.0,moonshotai/Kimi-K2-Instruct-0905,tune-mjcf,589.374911,True,0.4,True,589.374911 +2e2adf0f-ee9f-4f3c-b1c3-fff4213ae2dd,claude-opus-4-1-20250805,anthropic,install-klee-minimal,15296,2547,17843,901.186887,False,0.0,claude-opus-4-1-20250805,install-klee-minimal,901.186887,False,0.0,False,901.186887 +5d6f69e5-d438-4655-96de-eb06766de45b,grok-code-fast-1,xai,vulnerable-secret,9973,3323,13296,901.137682,False,0.0,grok-code-fast-1,vulnerable-secret,901.137682,False,0.6,False,901.137682 +5ac7e773-e660-424d-815e-dcdede114691,gpt-5-mini,openai,adaptive-rejection-sampler,3217,12530,15747,946.678663,False,0.0,gpt-5-mini,adaptive-rejection-sampler,946.678663,False,0.4,False,946.678663 +c9511fbf-837e-44cf-98ef-e01227d81b1f,gemini-2.5-flash,gemini,feal-differential-cryptanalysis,2495,2789,5284,335.795619,True,1.0,gemini-2.5-flash,feal-differential-cryptanalysis,335.795619,True,0.2,True,335.795619 +2e1d3012-18d7-4b49-93c9-b35f1ffe3518,moonshotai/Kimi-K2-Instruct-0905,together_ai,qemu-startup,1832,1990,3822,1012.517922,False,0.0,moonshotai/Kimi-K2-Instruct-0905,qemu-startup,1012.517922,False,0.4,False,1012.517922 +a9104fa7-3fa9-422d-8f9a-af735310996c,gpt-5,openai,count-dataset-tokens,8079,5929,14008,516.552996,False,0.0,gpt-5,count-dataset-tokens,516.552996,False,0.1666666666666666,False,516.552996 +db0686cb-5e8b-4af6-b897-5b4d540288e5,zai-org/GLM-4.5-Air-FP8,together_ai,polyglot-rust-c,15389,17300,32689,910.165354,False,0.0,zai-org/GLM-4.5-Air-FP8,polyglot-rust-c,910.165354,False,0.0,False,910.165354 
+33e66ecc-3e50-460d-ab42-eba27e76550e,claude-sonnet-4-20250514,anthropic,path-tracing,6583,6127,12710,501.448726,False,0.0,claude-sonnet-4-20250514,path-tracing,501.448726,False,0.0,False,501.448726 +f284a38b-f6a0-4af8-a2e1-77982f8da90d,zai-org/GLM-4.5-Air-FP8,together_ai,qemu-startup,670,2064,2734,906.872479,False,0.0,zai-org/GLM-4.5-Air-FP8,qemu-startup,906.872479,False,0.2,False,906.872479 +b9080d52-635b-47fd-8ad4-2f2847029136,deepseek-ai/DeepSeek-V3.1,together_ai,chess-best-move,11007,3025,14032,422.05488,False,0.0,deepseek-ai/DeepSeek-V3.1,chess-best-move,422.05488,False,0.0,False,422.05488 +696069f5-30cb-4cec-a4a2-4c8e8658bd45,grok-4-0709,xai,bn-fit-modify,19455,10273,29728,2622.69476,False,0.0,grok-4-0709,bn-fit-modify,2622.69476,False,0.6,False,2622.69476 +52a07a4d-fcb0-41b0-8435-cfc29f2a0666,gpt-5-mini,openai,distribution-search,20398,17347,37745,1429.156094,True,1.0,gpt-5-mini,distribution-search,1429.156094,True,1.0,True,1429.156094 +ff51f94c-37d8-43ba-8c47-df32a70b6048,gpt-5-mini,openai,path-tracing,12700,7290,19990,853.573439,False,0.0,gpt-5-mini,path-tracing,853.573439,False,0.0,False,853.573439 +798bee1c-abcc-48de-a764-383c2b54fc1a,grok-4-0709,xai,bn-fit-modify,25641,7312,32953,2074.064092,True,1.0,grok-4-0709,bn-fit-modify,2074.064092,True,0.6,True,2074.064092 +62f72753-02e1-47af-86e8-bd5c5d7e673f,claude-sonnet-4-20250514,anthropic,gpt2-codegolf,8796,9240,18036,727.244777,False,0.0,claude-sonnet-4-20250514,gpt2-codegolf,727.244777,False,0.0,False,727.244777 +b7c4e7b1-a7ef-4e4a-ad61-abf3c9d88c8e,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,feal-linear-cryptanalysis,15519,14152,29671,1836.86963,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,feal-linear-cryptanalysis,1836.86963,False,0.0,False,1836.86963 +82f712df-a525-482b-9571-4d0058cadbb4,deepseek-ai/DeepSeek-V3.1,together_ai,polyglot-rust-c,14403,15192,29595,900.001404,False,0.0,deepseek-ai/DeepSeek-V3.1,polyglot-rust-c,900.001404,False,0.0,False,900.001404 
+b8c86452-c159-4f72-9021-5620fb5877fc,OpenAI/gpt-oss-20B,together_ai,large-scale-text-editing,516,2973,3489,218.138787,False,0.0,OpenAI/gpt-oss-20B,large-scale-text-editing,218.138787,False,0.0,False,218.138787 +94863fd0-50ce-4be6-894a-eb0d0256c2e0,zai-org/GLM-4.5-Air-FP8,together_ai,model-extraction-relu-logits,2019,2216,4235,140.90876,False,0.0,zai-org/GLM-4.5-Air-FP8,model-extraction-relu-logits,140.90876,False,0.2,False,140.90876 +d60e7b89-5170-4140-8897-2d9462402455,gpt-5,openai,count-dataset-tokens,5905,4603,10508,663.083849,True,1.0,gpt-5,count-dataset-tokens,663.083849,True,0.1666666666666666,True,663.083849 +fc133464-aad8-47d1-a846-b7b52278b7f7,moonshotai/Kimi-K2-Instruct-0905,together_ai,winning-avg-corewars,13350,11435,24785,2741.376983,False,0.0,moonshotai/Kimi-K2-Instruct-0905,winning-avg-corewars,2741.376983,False,0.0,False,2741.376983 +9c57bd96-8700-4ff8-9b58-3999eb0b95c3,OpenAI/gpt-oss-20B,together_ai,count-dataset-tokens,1596,5153,6749,914.908032,False,0.0,OpenAI/gpt-oss-20B,count-dataset-tokens,914.908032,False,0.0,False,914.908032 +f56cf574-254b-454d-86db-ac4381a25790,grok-4-0709,xai,largest-eigenval,5390,4084,9474,901.437261,False,0.0,grok-4-0709,largest-eigenval,901.437261,False,0.0,False,901.437261 +5e56ea48-a2e9-4ff3-a960-1ad4d38b53b7,gpt-5-mini,openai,distribution-search,26325,23588,49913,2123.276968,True,1.0,gpt-5-mini,distribution-search,2123.276968,True,1.0,True,2123.276968 +c935f7f6-6819-4116-a924-6ff5558d5ee0,gpt-5,openai,hf-model-inference,3786,1780,5566,170.313113,True,1.0,gpt-5,hf-model-inference,170.313113,True,1.0,True,170.313113 +58028152-1114-4c65-9ee9-18a6f8605195,gpt-5-mini,openai,feal-differential-cryptanalysis,5318,3755,9073,354.333943,False,0.0,gpt-5-mini,feal-differential-cryptanalysis,354.333943,False,0.0,False,354.333943 
+d8cc0b61-15c9-42ec-bebf-f4ef420826f2,zai-org/GLM-4.5-Air-FP8,together_ai,count-dataset-tokens,15030,5231,20261,905.280255,False,0.0,zai-org/GLM-4.5-Air-FP8,count-dataset-tokens,905.280255,False,0.0,False,905.280255 +bbbac5dd-e18f-4881-9561-68e14c072e9c,gpt-5,openai,fix-ocaml-gc,17842,14127,31969,3600.019834,False,0.0,gpt-5,fix-ocaml-gc,3600.019834,False,0.0,False,3600.019834 +02188842-7988-46c0-9b17-aa49ad59b165,gpt-5-nano,openai,merge-diff-arc-agi-task,10871,6680,17551,454.908975,True,1.0,gpt-5-nano,merge-diff-arc-agi-task,454.908975,True,0.2,True,454.908975 +98742de8-4277-4360-a635-3637adc1e4f1,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,form-filling,3081,2065,5146,211.917987,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,form-filling,211.917987,False,0.0,False,211.917987 +62edb066-bb81-4e37-8f28-c90baefc7b23,deepseek-ai/DeepSeek-V3.1,together_ai,port-compressor,55698,41458,97156,3605.12597,False,0.0,deepseek-ai/DeepSeek-V3.1,port-compressor,3605.12597,False,0.0,False,3605.12597 +20aabab7-1d52-463e-9ced-3c5ba07deedc,zai-org/GLM-4.5-Air-FP8,together_ai,pypi-server,4896,3555,8451,436.588969,False,0.0,zai-org/GLM-4.5-Air-FP8,pypi-server,436.588969,False,0.2,False,436.588969 +115fe85d-e11d-4e77-8ee0-bcf687ab1799,moonshotai/Kimi-K2-Instruct-0905,together_ai,sanitize-git-repo,9183,4399,13582,656.610933,False,0.0,moonshotai/Kimi-K2-Instruct-0905,sanitize-git-repo,656.610933,False,0.0,False,656.610933 +55680f76-afa8-44ed-9c35-8450c50286fd,moonshotai/Kimi-K2-Instruct-0905,together_ai,fix-code-vulnerability,14670,7936,22606,930.576183,False,0.0,moonshotai/Kimi-K2-Instruct-0905,fix-code-vulnerability,930.576183,False,0.0,False,930.576183 +0d5a2add-a3a9-4d77-9cdd-1ba8a2903d3d,zai-org/GLM-4.5-Air-FP8,together_ai,circuit-fibsqrt,22605,26915,49520,1501.638539,False,0.0,zai-org/GLM-4.5-Air-FP8,circuit-fibsqrt,1501.638539,False,0.0,False,1501.638539 
+6fe11f90-0267-4a81-84ff-10eb804a4884,openai/gpt-oss-120b,together_ai,reverse-engineering,10409,22058,32467,1804.178101,False,0.0,openai/gpt-oss-120b,reverse-engineering,1804.178101,False,0.2,False,1804.178101 +d4dde4c0-53e0-475a-86b2-d0c815c56884,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,dna-insert,6861,2900,9761,360.416892,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,dna-insert,360.416892,False,0.0,False,360.416892 +40616c3c-a933-455c-891e-71a20c379e9c,zai-org/GLM-4.5-Air-FP8,together_ai,configure-git-webserver,12824,7838,20662,788.794964,False,0.0,zai-org/GLM-4.5-Air-FP8,configure-git-webserver,788.794964,False,0.0,False,788.794964 +a628caf2-3b24-4267-b396-6224b0ea28fb,claude-opus-4-1-20250805,anthropic,build-pov-ray,16027,6103,22130,600.042798,True,1.0,claude-opus-4-1-20250805,build-pov-ray,600.042798,True,0.75,True,600.042798 +70a1c023-8126-49a3-938d-7cea810588fe,grok-code-fast-1,xai,feal-linear-cryptanalysis,10865,7181,18046,631.881206,False,0.0,grok-code-fast-1,feal-linear-cryptanalysis,631.881206,False,0.0,False,631.881206 +4aa13201-97bd-4e63-8fa8-e76e4fc039c4,gpt-5,openai,sqlite-db-truncate,6863,4706,11569,533.71273,False,0.0,gpt-5,sqlite-db-truncate,533.71273,False,0.0,False,533.71273 +301a20c7-1438-4568-ba66-aff2c1f19fac,grok-code-fast-1,xai,video-processing,2440,1745,4185,84.751585,False,0.0,grok-code-fast-1,video-processing,84.751585,False,0.0,False,84.751585 +ce45e7da-75b8-479a-905b-d50c058073b7,gemini-2.5-pro,gemini,gpt2-codegolf,5871,8537,14408,925.61234,False,0.0,gemini-2.5-pro,gpt2-codegolf,925.61234,False,0.0,False,925.61234 +30c39365-b589-4068-a684-50617e917c37,zai-org/GLM-4.5-Air-FP8,together_ai,chess-best-move,13533,4303,17836,632.160736,False,0.0,zai-org/GLM-4.5-Air-FP8,chess-best-move,632.160736,False,0.0,False,632.160736 
+3efd40f7-5f58-4f53-a526-6ecc65feed68,claude-opus-4-1-20250805,anthropic,large-scale-text-editing,5127,5639,10766,669.653332,True,1.0,claude-opus-4-1-20250805,large-scale-text-editing,669.653332,True,0.6666666666666666,True,669.653332 +675fa499-2e18-4af8-85dd-0ce2f4a0ad59,gemini-2.5-pro,gemini,wasm-pipeline,14488,4878,19366,921.189737,False,0.0,gemini-2.5-pro,wasm-pipeline,921.189737,False,0.0,False,921.189737 +ac7e5321-4a79-4c78-9fd4-fff9eaba21ba,gemini-2.5-pro,gemini,qemu-alpine-ssh,1923,1699,3622,227.564224,False,0.0,gemini-2.5-pro,qemu-alpine-ssh,227.564224,False,0.2,False,227.564224 +7ebb4290-803f-486c-b928-6409d9dc417d,deepseek-ai/DeepSeek-V3.1,together_ai,openssl-selfsigned-cert,4206,2743,6949,298.786631,True,1.0,deepseek-ai/DeepSeek-V3.1,openssl-selfsigned-cert,298.786631,True,1.0,True,298.786631 +c80b612e-c453-4a90-a539-431647251b3c,openai/gpt-oss-120b,together_ai,dna-assembly,8911,10395,19306,737.300847,False,0.0,openai/gpt-oss-120b,dna-assembly,737.300847,False,0.0,False,737.300847 +45b4f001-68c4-4ba2-a015-e81dd85d9ed3,gpt-5-mini,openai,write-compressor,2992,1437,4429,272.563807,False,0.0,gpt-5-mini,write-compressor,272.563807,False,0.0,False,272.563807 +d1d93f71-5f04-4bae-85c4-47e76b49270e,grok-code-fast-1,xai,tune-mjcf,7203,6312,13515,946.07418,False,0.0,grok-code-fast-1,tune-mjcf,946.07418,False,0.4,False,946.07418 +98c24cda-934d-4b66-8665-73d09202625b,grok-code-fast-1,xai,constraints-scheduling,3419,2296,5715,457.227131,True,1.0,grok-code-fast-1,constraints-scheduling,457.227131,True,0.8,True,457.227131 +8fba36f8-264b-48fa-b22c-5b693fe44c36,gpt-5,openai,feal-differential-cryptanalysis,2595,1213,3808,527.229762,False,0.0,gpt-5,feal-differential-cryptanalysis,527.229762,False,0.0,False,527.229762 +19d5dad0-86e9-4835-8099-667c6757bef3,gpt-5-mini,openai,chess-best-move,18950,12854,31804,805.153257,False,0.0,gpt-5-mini,chess-best-move,805.153257,False,0.0,False,805.153257 
+a1bd368b-70f4-437b-8205-5f04f11eefa4,deepseek-ai/DeepSeek-V3.1,together_ai,sanitize-git-repo,13936,2304,16240,259.682539,False,0.0,deepseek-ai/DeepSeek-V3.1,sanitize-git-repo,259.682539,False,0.0,False,259.682539 +b3461fee-2a1a-4539-b33b-5027e4ab3c9f,claude-opus-4-1-20250805,anthropic,tune-mjcf,9924,7885,17809,907.472763,False,0.0,claude-opus-4-1-20250805,tune-mjcf,907.472763,False,0.25,False,907.472763 +83013d73-49df-4065-9bd3-3ffc1642e4dd,moonshotai/Kimi-K2-Instruct-0905,together_ai,model-extraction-relu-logits,13207,7048,20255,529.043405,False,0.0,moonshotai/Kimi-K2-Instruct-0905,model-extraction-relu-logits,529.043405,False,0.4,False,529.043405 +b2788058-e06c-4526-b055-4998d1f9ae33,gemini-2.5-flash,gemini,large-scale-text-editing,1878,1945,3823,352.885575,False,0.0,gemini-2.5-flash,large-scale-text-editing,352.885575,False,0.0,False,352.885575 +39245809-5dc6-43dc-8f46-22354480c47c,gpt-5-nano,openai,password-recovery,2306,5380,7686,900.719173,False,0.0,gpt-5-nano,password-recovery,900.719173,False,0.0,False,900.719173 +568fdf21-3941-49db-b68c-3196a84d4a05,gpt-5,openai,large-scale-text-editing,6540,1656,8196,164.122586,True,1.0,gpt-5,large-scale-text-editing,164.122586,True,0.4285714285714285,True,164.122586 +8dca7f3b-0e4f-4fef-b804-f6961fbd70a1,gemini-2.5-flash,gemini,qemu-startup,1381,1343,2724,164.075666,False,0.0,gemini-2.5-flash,qemu-startup,164.075666,False,0.2,False,164.075666 +d04c0a1b-f507-48a2-b04a-449174b0d17b,grok-4-0709,xai,fix-git,2038,1867,3905,355.122256,True,1.0,grok-4-0709,fix-git,355.122256,True,1.0,True,355.122256 +81455380-ab27-40c8-95c0-5119d8b0a9b6,openai/gpt-oss-120b,together_ai,schemelike-metacircular-eval,7100,3041,10141,284.288081,False,0.0,openai/gpt-oss-120b,schemelike-metacircular-eval,284.288081,False,0.0,False,284.288081 
+df251c62-6bce-4c8b-9655-df615dd1a2f4,OpenAI/gpt-oss-20B,together_ai,model-extraction-relu-logits,168,972,1140,101.382685,False,0.0,OpenAI/gpt-oss-20B,model-extraction-relu-logits,101.382685,False,0.0,False,101.382685 +f6444afd-b425-49c9-a9b0-fa3b8ef2211c,grok-code-fast-1,xai,regex-log,1336,671,2007,113.024727,False,0.0,grok-code-fast-1,regex-log,113.024727,False,0.0,False,113.024727 +faeeb025-41d2-4ea6-8445-0fe223b4bc41,openai/gpt-oss-120b,together_ai,adaptive-rejection-sampler,4845,4009,8854,530.766233,False,0.0,openai/gpt-oss-120b,adaptive-rejection-sampler,530.766233,False,0.0,False,530.766233 +06b36570-1863-4146-99f7-f761290703de,zai-org/GLM-4.5-Air-FP8,together_ai,install-klee-minimal,7251,1456,8707,903.034776,False,0.0,zai-org/GLM-4.5-Air-FP8,install-klee-minimal,903.034776,False,0.0,False,903.034776 +264f3b92-533b-43c2-af22-c2b5891928b6,gpt-5,openai,db-wal-recovery,9970,7037,17007,585.510196,False,0.0,gpt-5,db-wal-recovery,585.510196,False,0.1428571428571428,False,585.510196 +2674f06e-ffdf-4000-99d0-9e9e16f77d94,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,db-wal-recovery,1805,1073,2878,245.734725,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,db-wal-recovery,245.734725,False,0.0,False,245.734725 +f3f3304f-7e65-4bfd-8f58-cf6c88a4e9f0,gpt-5,openai,path-tracing-reverse,13980,5792,19772,852.630629,False,0.0,gpt-5,path-tracing-reverse,852.630629,False,0.0,False,852.630629 +5d676335-bede-4a46-940f-6577e9de7bf2,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,make-mips-interpreter,25583,13198,38781,1518.34756,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,make-mips-interpreter,1518.34756,False,0.0,False,1518.34756 +61674130-ed1a-4ff1-81a9-250181621a7b,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,reshard-c4-data,14590,11211,25801,2067.149465,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,reshard-c4-data,2067.149465,False,0.0,False,2067.149465 
+74324bec-f1be-4d47-a7cc-b72993ddc0da,OpenAI/gpt-oss-20B,together_ai,build-pov-ray,168,698,866,130.354514,False,0.0,OpenAI/gpt-oss-20B,build-pov-ray,130.354514,False,0.0,False,130.354514 +d65ab5f7-7c05-4002-9c09-4d7432cbfef8,openai/gpt-oss-120b,together_ai,chess-best-move,4652,5234,9886,332.801006,False,0.0,openai/gpt-oss-120b,chess-best-move,332.801006,False,0.0,False,332.801006 +03b407d8-9886-49cc-b381-7f6043245e47,gpt-5-mini,openai,pypi-server,2784,1308,4092,245.838615,True,1.0,gpt-5-mini,pypi-server,245.838615,True,0.8,True,245.838615 +9842df1a-15f2-4b48-adde-c1283523f546,gemini-2.5-flash,gemini,break-filter-js-from-html,4174,13202,17376,1203.721666,False,0.0,gemini-2.5-flash,break-filter-js-from-html,1203.721666,False,0.0,False,1203.721666 +1a575449-6f93-48c1-873e-235602f611d3,grok-code-fast-1,xai,polyglot-rust-c,1164,719,1883,143.00186,False,0.0,grok-code-fast-1,polyglot-rust-c,143.00186,False,0.0,False,143.00186 +1919cf9a-1fd6-4bde-aaae-caaa9e851c49,gpt-5,openai,run-pdp11-code,4997,4982,9979,1007.683648,False,0.0,gpt-5,run-pdp11-code,1007.683648,False,0.0,False,1007.683648 +e0f3f922-f08a-469c-80fb-5e82048becd7,claude-sonnet-4-20250514,anthropic,fix-code-vulnerability,19933,8674,28607,902.056481,True,1.0,claude-sonnet-4-20250514,fix-code-vulnerability,902.056481,True,0.8,True,902.056481 +12d2ff45-5d78-4e93-ae43-67d218550b9a,grok-code-fast-1,xai,fix-ocaml-gc,11774,3271,15045,475.455921,False,0.0,grok-code-fast-1,fix-ocaml-gc,475.455921,False,0.0,False,475.455921 +7a3f7aa6-f66f-4cab-be1b-efa3b39425cb,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,adaptive-rejection-sampler,6098,2289,8387,443.831953,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,adaptive-rejection-sampler,443.831953,False,0.0,False,443.831953 +a1cbb638-d051-4b6e-b15e-b1bad9716260,gpt-5,openai,sparql-university,5810,2052,7862,223.38647,True,1.0,gpt-5,sparql-university,223.38647,True,0.8,True,223.38647 
+7839b505-869d-4b41-a79b-30c0a67b9998,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,chess-best-move,4695,2841,7536,331.307165,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,chess-best-move,331.307165,False,0.0,False,331.307165 +970ca86b-aafb-48bd-a7ce-bc3ec4588332,gpt-5-nano,openai,hf-model-inference,12266,5786,18052,900.225072,False,0.0,gpt-5-nano,hf-model-inference,900.225072,False,0.4,False,900.225072 +311b3138-75b1-4a83-8d4d-cf258de0d3f0,claude-opus-4-1-20250805,anthropic,cobol-modernization,9877,8163,18040,240.765361,True,1.0,claude-opus-4-1-20250805,cobol-modernization,240.765361,True,0.875,True,240.765361 +fefd6259-132e-4ed0-b7a3-18a1dd449598,claude-sonnet-4-20250514,anthropic,video-processing,4773,3759,8532,242.910185,False,0.0,claude-sonnet-4-20250514,video-processing,242.910185,False,0.0,False,242.910185 +9468c801-e77b-476d-9e56-c7618c84dd59,gemini-2.5-flash,gemini,fix-git,2161,1630,3791,80.054881,True,1.0,gemini-2.5-flash,fix-git,80.054881,True,0.8,True,80.054881 +08ebdb3a-5d6f-4a70-aa50-0146188f0cc2,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,filter-js-from-html,7135,7251,14386,900.464949,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,filter-js-from-html,900.464949,False,0.0,False,900.464949 +696ebfe5-84c3-4be8-a817-a71ca527e29f,gemini-2.5-flash,gemini,git-leak-recovery,2931,3715,6646,678.939516,True,1.0,gemini-2.5-flash,git-leak-recovery,678.939516,True,0.6,True,678.939516 +27d5a996-8f33-4373-ae7f-1b57de147385,grok-4-0709,xai,schemelike-metacircular-eval,7092,4084,11176,2414.199164,False,0.0,grok-4-0709,schemelike-metacircular-eval,2414.199164,False,0.0,False,2414.199164 +561d7842-83b8-4a42-b69a-65cf1e9fad86,OpenAI/gpt-oss-20B,together_ai,adaptive-rejection-sampler,1666,1645,3311,356.535976,False,0.0,OpenAI/gpt-oss-20B,adaptive-rejection-sampler,356.535976,False,0.0,False,356.535976 
+022e116a-8e48-46f4-8851-16d0f4ecfd30,gpt-5-mini,openai,configure-git-webserver,4387,1400,5787,134.555983,True,1.0,gpt-5-mini,configure-git-webserver,134.555983,True,0.6,True,134.555983 +3532584f-cbd8-4005-83ae-a72d4331b47d,gpt-5-mini,openai,install-windows-3.11,7252,3907,11159,366.33384,False,0.0,gpt-5-mini,install-windows-3.11,366.33384,False,0.0,False,366.33384 +74a4f208-3c27-4f27-96bb-52c44f81778c,moonshotai/Kimi-K2-Instruct-0905,together_ai,nginx-request-logging,5918,4250,10168,487.801388,False,0.0,moonshotai/Kimi-K2-Instruct-0905,nginx-request-logging,487.801388,False,0.4,False,487.801388 +e427563b-6a0b-496a-81c2-19b1e8d77054,openai/gpt-oss-120b,together_ai,train-fasttext,12410,3780,16190,1430.868638,False,0.0,openai/gpt-oss-120b,train-fasttext,1430.868638,False,0.0,False,1430.868638 +b07b256a-1949-489f-8763-b2329326d1fc,claude-opus-4-1-20250805,anthropic,hf-model-inference,4548,3241,7789,616.661995,False,0.0,claude-opus-4-1-20250805,hf-model-inference,616.661995,False,0.25,False,616.661995 +fb7ce6a8-1731-4ba8-beaa-e05eeecbf57b,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,merge-diff-arc-agi-task,11509,5060,16569,934.984083,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,merge-diff-arc-agi-task,934.984083,False,0.0,False,934.984083 +ccc90aa0-cf7a-4035-81cd-0f8466951ee7,zai-org/GLM-4.5-Air-FP8,together_ai,path-tracing,9836,6190,16026,191.306486,False,0.0,zai-org/GLM-4.5-Air-FP8,path-tracing,191.306486,False,0.0,False,191.306486 +d55dee49-5c23-4134-9081-633c2b231440,deepseek-ai/DeepSeek-V3.1,together_ai,nginx-request-logging,4564,2101,6665,510.60575,False,0.0,deepseek-ai/DeepSeek-V3.1,nginx-request-logging,510.60575,False,0.4,False,510.60575 +43d41eec-c1ce-4811-a9f3-709100cf4b74,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,run-pdp11-code,3231,2340,5571,456.179936,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,run-pdp11-code,456.179936,False,0.0,False,456.179936 
+f24f41b4-cc98-4e13-8806-ece358093e32,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,pytorch-model-cli,9850,6012,15862,817.143022,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,pytorch-model-cli,817.143022,False,0.0,False,817.143022 +aee19d22-795e-466b-add5-664de2494788,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,filter-js-from-html,1624,913,2537,21.252784,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,filter-js-from-html,21.252784,False,0.0,False,21.252784 +9110aac7-51a0-4e89-9762-bab6828604c4,deepseek-ai/DeepSeek-V3.1,together_ai,prove-plus-comm,2324,1675,3999,490.490105,True,1.0,deepseek-ai/DeepSeek-V3.1,prove-plus-comm,490.490105,True,1.0,True,490.490105 +ece24654-de34-4d17-8f2b-105a75802be4,gpt-5,openai,make-mips-interpreter,3016,32160,35176,1820.739403,False,0.0,gpt-5,make-mips-interpreter,1820.739403,False,0.0,False,1820.739403 +57b5a96c-276a-4199-ad96-d7759d0a4e32,gpt-5,openai,circuit-fibsqrt,19723,38645,58368,3606.389434,False,0.0,gpt-5,circuit-fibsqrt,3606.389434,False,0.6666666666666666,False,3606.389434 +3df39360-b769-4bf1-b365-32dc8564cc64,grok-code-fast-1,xai,extract-elf,1469,991,2460,91.67386,True,1.0,grok-code-fast-1,extract-elf,91.67386,True,0.6,True,91.67386 +70fe8fa7-e0a5-4062-aa04-419e348b19a3,moonshotai/Kimi-K2-Instruct-0905,together_ai,port-compressor,94596,58696,153292,2081.210711,False,0.0,moonshotai/Kimi-K2-Instruct-0905,port-compressor,2081.210711,False,0.0,False,2081.210711 +b47d132b-0864-458b-941a-c35c3025ecc0,deepseek-ai/DeepSeek-V3.1,together_ai,financial-document-processor,13521,4385,17906,354.047559,False,0.0,deepseek-ai/DeepSeek-V3.1,financial-document-processor,354.047559,False,0.0,False,354.047559 +d7656e62-144b-43f0-8f15-e61ca9299d66,grok-4-0709,xai,nginx-request-logging,4842,4344,9186,900.498498,True,1.0,grok-4-0709,nginx-request-logging,900.498498,True,1.0,True,900.498498 
+fb0bcbd7-f53d-47f1-b5d1-2b3c22ec8ba6,grok-code-fast-1,xai,reverse-engineering,8069,4443,12512,773.107443,False,0.0,grok-code-fast-1,reverse-engineering,773.107443,False,0.0,False,773.107443 +521a60cb-9f6b-4c83-a43b-02f40515200d,claude-opus-4-1-20250805,anthropic,openssl-selfsigned-cert,3311,2646,5957,169.691858,True,1.0,claude-opus-4-1-20250805,openssl-selfsigned-cert,169.691858,True,1.0,True,169.691858 +e1e39383-bdb7-4ee7-beaa-ac30ab3fb79d,gpt-5-nano,openai,port-compressor,15798,23143,38941,3605.16392,False,0.0,gpt-5-nano,port-compressor,3605.16392,False,0.0,False,3605.16392 +f9d1aa7d-8bbd-440b-b0e0-fe8c09438f66,claude-opus-4-1-20250805,anthropic,install-windows-3.11,8471,2817,11288,272.578105,False,0.0,claude-opus-4-1-20250805,install-windows-3.11,272.578105,False,0.0,False,272.578105 +8a07ec33-5adb-425e-a29b-0341d2090844,gemini-2.5-flash,gemini,bn-fit-modify,38213,41273,79486,3639.357988,False,0.0,gemini-2.5-flash,bn-fit-modify,3639.357988,False,0.0,False,3639.357988 +b5e69394-6dd8-42d4-b61c-b943337d39c3,gpt-5,openai,feal-linear-cryptanalysis,7300,4073,11373,908.290389,True,1.0,gpt-5,feal-linear-cryptanalysis,908.290389,True,1.0,True,908.290389 +1db1dc95-9af0-4cf1-b72c-3eb59b9c4e7d,OpenAI/gpt-oss-20B,together_ai,reshard-c4-data,1437,1950,3387,150.391438,False,0.0,OpenAI/gpt-oss-20B,reshard-c4-data,150.391438,False,0.0,False,150.391438 +5eb80d76-1da9-499e-bba9-8c4418cbdac5,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,adaptive-rejection-sampler,11780,3505,15285,452.566367,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,adaptive-rejection-sampler,452.566367,False,0.0,False,452.566367 +ee777adb-bd45-4d0a-811d-3814eaae0c3d,OpenAI/gpt-oss-20B,together_ai,make-mips-interpreter,6664,27111,33775,1807.920061,False,0.0,OpenAI/gpt-oss-20B,make-mips-interpreter,1807.920061,False,0.0,False,1807.920061 
+17fc11cb-44ae-467b-b3f5-70f6356768d6,gpt-5-nano,openai,distribution-search,34246,44430,78676,3605.859821,False,0.0,gpt-5-nano,distribution-search,3605.859821,False,0.25,False,3605.859821 +c529bee6-4438-4267-989c-ab9b5898be10,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,prove-plus-comm,1402,1181,2583,277.914475,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,prove-plus-comm,277.914475,False,0.0,False,277.914475 +5d8e8b0d-b08b-4f19-8aba-c4c3f4c5218c,claude-sonnet-4-20250514,anthropic,run-pdp11-code,1946,1142,3088,1001.265534,False,0.0,claude-sonnet-4-20250514,run-pdp11-code,1001.265534,False,0.0,False,1001.265534 +5e1c948c-844a-4a8c-8365-a0fbb4e59453,OpenAI/gpt-oss-20B,together_ai,form-filling,200,1570,1770,107.531632,False,0.0,OpenAI/gpt-oss-20B,form-filling,107.531632,False,0.0,False,107.531632 +e258f068-1643-497f-ab31-bbfdfa81ce10,gpt-5-nano,openai,polyglot-rust-c,1718,1754,3472,308.956451,False,0.0,gpt-5-nano,polyglot-rust-c,308.956451,False,0.0,False,308.956451 +fc2922a6-caf1-43be-9431-10eba3aac8b7,gpt-5-nano,openai,constraints-scheduling,10805,15904,26709,1200.008872,False,0.0,gpt-5-nano,constraints-scheduling,1200.008872,False,0.4,False,1200.008872 +1bc29876-46a9-4dc2-a58a-55ce61e57bc4,zai-org/GLM-4.5-Air-FP8,together_ai,pypi-server,3582,1756,5338,361.469137,False,0.0,zai-org/GLM-4.5-Air-FP8,pypi-server,361.469137,False,0.2,False,361.469137 +1fa7a8d7-eb31-4308-b71b-2075a92e0f51,claude-opus-4-1-20250805,anthropic,install-klee-minimal,13021,1610,14631,923.610495,False,0.0,claude-opus-4-1-20250805,install-klee-minimal,923.610495,False,0.0,False,923.610495 +f912fa47-df61-49c9-a31c-a11b2afce051,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,filter-js-from-html,2456,1758,4214,67.69575,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,filter-js-from-html,67.69575,False,0.0,False,67.69575 
+fd44c5eb-2a25-4727-a1af-132a49b9d806,gemini-2.5-flash,gemini,pytorch-model-recovery,12546,10807,23353,910.551912,False,0.0,gemini-2.5-flash,pytorch-model-recovery,910.551912,False,0.2,False,910.551912 +2fba23b9-6920-41e2-ba80-5baae420cd47,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,fix-code-vulnerability,15037,5074,20111,900.055103,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,fix-code-vulnerability,900.055103,False,0.0,False,900.055103 +13e970cf-3aa0-47ab-8c9a-303ec4e7b4ab,OpenAI/gpt-oss-20B,together_ai,dna-assembly,3280,10230,13510,721.18646,False,0.0,OpenAI/gpt-oss-20B,dna-assembly,721.18646,False,0.0,False,721.18646 +467c27cc-4a7c-42e4-b52e-40b29d1744ff,deepseek-ai/DeepSeek-V3.1,together_ai,largest-eigenval,7371,6318,13689,739.444421,False,0.0,deepseek-ai/DeepSeek-V3.1,largest-eigenval,739.444421,False,0.2,False,739.444421 +761d588c-a9b6-4ce8-87ee-27c6ec8d6851,OpenAI/gpt-oss-20B,together_ai,qemu-startup,1479,1827,3306,43.907312,False,0.0,OpenAI/gpt-oss-20B,qemu-startup,43.907312,False,0.0,False,43.907312 +d28f6ef7-a454-41a2-9937-a1473052751d,gemini-2.5-pro,gemini,log-summary-date-ranges,7080,1744,8824,210.256406,False,0.0,gemini-2.5-pro,log-summary-date-ranges,210.256406,False,0.0,False,210.256406 +c026bb4f-9718-431e-80f8-a2a9705c6356,grok-code-fast-1,xai,run-pdp11-code,2569,1884,4453,289.745059,False,0.0,grok-code-fast-1,run-pdp11-code,289.745059,False,0.0,False,289.745059 +83707105-078e-45b3-ac52-7d32d7067d23,gemini-2.5-flash,gemini,schemelike-metacircular-eval,6005,4129,10134,406.40546,False,0.0,gemini-2.5-flash,schemelike-metacircular-eval,406.40546,False,0.2,False,406.40546 +e0d295a4-a48f-4d07-8014-fb0ba5dd65bb,gemini-2.5-flash,gemini,sparql-university,1563,808,2371,116.44352,False,0.0,gemini-2.5-flash,sparql-university,116.44352,False,0.0,False,116.44352 
+235287e7-1b7d-45ec-a9d6-16275623fa2b,moonshotai/Kimi-K2-Instruct-0905,together_ai,gpt2-codegolf,3463,3642,7105,462.656621,False,0.0,moonshotai/Kimi-K2-Instruct-0905,gpt2-codegolf,462.656621,False,0.0,False,462.656621 +8dcf4c5e-4ff7-45d9-9cc3-2f210e7b6330,gemini-2.5-flash,gemini,video-processing,2550,1969,4519,144.336566,False,0.0,gemini-2.5-flash,video-processing,144.336566,False,0.0,False,144.336566 +1aac18c2-72b0-4cff-b235-be3d00e77c73,zai-org/GLM-4.5-Air-FP8,together_ai,git-leak-recovery,2311,2071,4382,110.732175,True,1.0,zai-org/GLM-4.5-Air-FP8,git-leak-recovery,110.732175,True,0.8,True,110.732175 +61c1ebd6-ecd2-4589-aba4-dc0e8e9103bd,openai/gpt-oss-120b,together_ai,gpt2-codegolf,1718,2945,4663,213.935991,False,0.0,openai/gpt-oss-120b,gpt2-codegolf,213.935991,False,0.0,False,213.935991 +2c1c8620-33bb-4f7a-9e26-afca1ae296b3,openai/gpt-oss-120b,together_ai,hf-model-inference,3286,2347,5633,344.412713,False,0.0,openai/gpt-oss-120b,hf-model-inference,344.412713,False,0.0,False,344.412713 +99491274-4346-4e7c-a348-ac0036295123,grok-code-fast-1,xai,distribution-search,1590,1432,3022,218.328378,False,0.0,grok-code-fast-1,distribution-search,218.328378,False,0.0,False,218.328378 +00265c1a-6913-40d1-98bb-cb160f2425b3,OpenAI/gpt-oss-20B,together_ai,polyglot-rust-c,576,732,1308,65.929719,False,0.0,OpenAI/gpt-oss-20B,polyglot-rust-c,65.929719,False,0.0,False,65.929719 +b74023c2-0b20-451f-be53-7d2f0a7fc85d,gpt-5-nano,openai,sqlite-db-truncate,6147,5445,11592,904.584648,False,0.0,gpt-5-nano,sqlite-db-truncate,904.584648,False,0.0,False,904.584648 +bbd9c1fc-ec46-4167-a537-7462c28bc918,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,dna-insert,23056,4988,28044,203.638627,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,dna-insert,203.638627,False,0.0,False,203.638627 +9158073a-b01f-4bb3-b142-92498bcedcf8,gpt-5-nano,openai,wasm-pipeline,8651,7909,16560,906.744493,False,0.0,gpt-5-nano,wasm-pipeline,906.744493,False,0.0,False,906.744493 
+daf5cf88-434c-4e51-9abe-26786ffb8be1,OpenAI/gpt-oss-20B,together_ai,sanitize-git-repo,223,1778,2001,102.378839,False,0.0,OpenAI/gpt-oss-20B,sanitize-git-repo,102.378839,False,0.0,False,102.378839 +949a7f4c-8af3-4cdd-86ff-0aa5c51bab27,openai/gpt-oss-120b,together_ai,sparql-university,4738,996,5734,55.441049,False,0.0,openai/gpt-oss-120b,sparql-university,55.441049,False,0.0,False,55.441049 +a72353b9-8e9e-4429-a162-4a881f617712,gemini-2.5-flash,gemini,form-filling,15162,30492,45654,901.56128,False,0.0,gemini-2.5-flash,form-filling,901.56128,False,0.0,False,901.56128 +69910ede-e92f-479c-8f2a-7d02ef9d1f6c,deepseek-ai/DeepSeek-V3.1,together_ai,bn-fit-modify,13264,7334,20598,805.205108,False,0.0,deepseek-ai/DeepSeek-V3.1,bn-fit-modify,805.205108,False,0.0,False,805.205108 +7c6e1ea2-5271-46a9-8423-a481df3d362c,openai/gpt-oss-120b,together_ai,financial-document-processor,4049,4212,8261,149.308662,False,0.0,openai/gpt-oss-120b,financial-document-processor,149.308662,False,0.0,False,149.308662 +3100b553-e2f6-479c-9fcd-43164b4b5382,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-pov-ray,12974,3559,16533,508.419533,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-pov-ray,508.419533,False,0.0,False,508.419533 +3d882f34-d6a5-4838-9b32-c13118dace70,openai/gpt-oss-120b,together_ai,nginx-request-logging,3769,1045,4814,128.177112,True,1.0,openai/gpt-oss-120b,nginx-request-logging,128.177112,True,0.4,True,128.177112 +2bde6e26-cef3-4c39-beec-af16e99dcea2,gpt-5,openai,build-pmars,13376,4361,17737,618.237492,True,1.0,gpt-5,build-pmars,618.237492,True,0.8,True,618.237492 +9c253fb8-8230-4a81-9939-e549a065a59d,deepseek-ai/DeepSeek-V3.1,together_ai,mteb-retrieve,2287,1604,3891,247.913123,False,0.0,deepseek-ai/DeepSeek-V3.1,mteb-retrieve,247.913123,False,0.0,False,247.913123 
+73862c80-9049-4cc8-9b69-1dff8c4742ae,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sanitize-git-repo,2848,1292,4140,133.443598,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sanitize-git-repo,133.443598,False,0.0,False,133.443598 +f0ef115c-7434-4c6e-b7e9-c636519f3e05,gemini-2.5-pro,gemini,nginx-request-logging,3819,1497,5316,255.212445,True,1.0,gemini-2.5-pro,nginx-request-logging,255.212445,True,0.6,True,255.212445 +f85dbfdc-dc8c-4516-b2b6-b1c35c5297f6,openai/gpt-oss-120b,together_ai,mteb-leaderboard,1120,1306,2426,133.259922,False,0.0,openai/gpt-oss-120b,mteb-leaderboard,133.259922,False,0.0,False,133.259922 +11694e05-dd39-4133-90d4-44b0a3c2c831,moonshotai/Kimi-K2-Instruct-0905,together_ai,sqlite-db-truncate,4373,2506,6879,696.839561,False,0.0,moonshotai/Kimi-K2-Instruct-0905,sqlite-db-truncate,696.839561,False,0.0,False,696.839561 +eeab8b70-db97-416b-ac6b-41fc31c0f0d1,zai-org/GLM-4.5-Air-FP8,together_ai,vulnerable-secret,6897,14898,21795,907.118781,False,0.0,zai-org/GLM-4.5-Air-FP8,vulnerable-secret,907.118781,False,0.0,False,907.118781 +f52f0682-0868-4a95-b8d3-993e5b0193d6,gpt-5-nano,openai,feal-differential-cryptanalysis,4995,4854,9849,287.896496,False,0.0,gpt-5-nano,feal-differential-cryptanalysis,287.896496,False,0.0,False,287.896496 +1ddb6f62-5437-4951-96ae-6d69b770cf5d,deepseek-ai/DeepSeek-V3.1,together_ai,sparql-university,5973,3134,9107,393.138564,False,0.0,deepseek-ai/DeepSeek-V3.1,sparql-university,393.138564,False,0.0,False,393.138564 +3408c973-f574-4cd5-9135-13cf8f789daa,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,cobol-modernization,9334,7378,16712,668.916419,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,cobol-modernization,668.916419,True,0.4,True,668.916419 
+6fd820be-b25e-4425-9c6e-5c63969c1065,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,fix-ocaml-gc,120534,26712,147246,3602.848726,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,fix-ocaml-gc,3602.848726,False,0.0,False,3602.848726 +3ea753e1-fe93-4202-af79-4ab725485edf,OpenAI/gpt-oss-20B,together_ai,chess-best-move,974,450,1424,54.659025,False,0.0,OpenAI/gpt-oss-20B,chess-best-move,54.659025,False,0.0,False,54.659025 +c76fac31-7b71-4ebb-a593-c72fb75245d9,OpenAI/gpt-oss-20B,together_ai,polyglot-rust-c,159,909,1068,287.065675,False,0.0,OpenAI/gpt-oss-20B,polyglot-rust-c,287.065675,False,0.0,False,287.065675 +fdd94540-7594-49a7-bb23-783acb52fe21,OpenAI/gpt-oss-20B,together_ai,crack-7z-hash,1009,1278,2287,44.670902,False,0.0,OpenAI/gpt-oss-20B,crack-7z-hash,44.670902,False,0.0,False,44.670902 +4175eb1f-77b0-446d-900b-20e108dbe947,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,constraints-scheduling,15124,10306,25430,769.9245,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,constraints-scheduling,769.9245,False,0.0,False,769.9245 +c9d9ef1d-5312-4365-8b44-93d143d8df84,zai-org/GLM-4.5-Air-FP8,together_ai,bn-fit-modify,18451,10491,28942,661.523861,False,0.0,zai-org/GLM-4.5-Air-FP8,bn-fit-modify,661.523861,False,0.0,False,661.523861 +47386a09-06c2-42dc-82c7-3403a9b34349,claude-sonnet-4-20250514,anthropic,polyglot-rust-c,10279,11060,21339,901.27832,False,0.0,claude-sonnet-4-20250514,polyglot-rust-c,901.27832,False,0.0,False,901.27832 +08e75dd0-5878-4a1d-89fe-b79780f11dc1,claude-sonnet-4-20250514,anthropic,largest-eigenval,9686,7392,17078,902.578683,False,0.0,claude-sonnet-4-20250514,largest-eigenval,902.578683,False,0.0,False,902.578683 +c648a06e-140c-4bf5-b25d-3e1774847bc4,claude-opus-4-1-20250805,anthropic,distribution-search,31899,42487,74386,1513.986603,True,1.0,claude-opus-4-1-20250805,distribution-search,1513.986603,True,0.5555555555555556,True,1513.986603 
+f13f733e-e7af-4fa3-97d3-fdba0af836ae,claude-sonnet-4-20250514,anthropic,make-mips-interpreter,45092,41152,86244,1816.518797,False,0.0,claude-sonnet-4-20250514,make-mips-interpreter,1816.518797,False,0.0,False,1816.518797 +4a198c09-9a36-431c-8b87-9bfec3e599a4,gpt-5-mini,openai,form-filling,12609,12611,25220,370.006002,True,1.0,gpt-5-mini,form-filling,370.006002,True,1.0,True,370.006002 +f932b575-ef40-4f3a-9133-6208bf3e0a24,gemini-2.5-flash,gemini,port-compressor,52696,80070,132766,3632.902595,False,0.0,gemini-2.5-flash,port-compressor,3632.902595,False,0.0,False,3632.902595 +e7db87ce-d6f7-4932-9f01-6f1dc5210108,gemini-2.5-flash,gemini,nginx-request-logging,2026,11128,13154,923.493182,False,0.0,gemini-2.5-flash,nginx-request-logging,923.493182,False,0.0,False,923.493182 +c3b7988a-8d10-436b-8773-043aec47950b,gpt-5-mini,openai,run-pdp11-code,2573,1479,4052,258.077195,False,0.0,gpt-5-mini,run-pdp11-code,258.077195,False,0.0,False,258.077195 +529149a0-446d-4b3f-a6c9-fb67935eb125,gemini-2.5-flash,gemini,write-compressor,10312,25267,35579,900.860191,False,0.0,gemini-2.5-flash,write-compressor,900.860191,False,0.0,False,900.860191 +59204e86-ce9d-4ffd-a483-16166feb1b11,OpenAI/gpt-oss-20B,together_ai,pytorch-model-cli,682,1789,2471,231.397258,False,0.0,OpenAI/gpt-oss-20B,pytorch-model-cli,231.397258,False,0.0,False,231.397258 +36b00af7-a0f8-49c5-993d-b1a1fd35beb0,gpt-5,openai,merge-diff-arc-agi-task,7927,5911,13838,254.343024,True,1.0,gpt-5,merge-diff-arc-agi-task,254.343024,True,1.0,True,254.343024 +4eef11eb-05b9-45d2-84df-259ca47465ac,gemini-2.5-flash,gemini,torch-tensor-parallelism,2232,3989,6221,367.071263,False,0.0,gemini-2.5-flash,torch-tensor-parallelism,367.071263,False,0.0,False,367.071263 +ae3138f0-2540-4371-b691-427e74741a24,claude-sonnet-4-20250514,anthropic,make-mips-interpreter,29116,20200,49316,1804.113501,False,0.0,claude-sonnet-4-20250514,make-mips-interpreter,1804.113501,False,0.0,False,1804.113501 
+aa1572f4-169c-4092-912b-52f3d2f28782,openai/gpt-oss-120b,together_ai,bn-fit-modify,2629,2576,5205,274.847726,False,0.0,openai/gpt-oss-120b,bn-fit-modify,274.847726,False,0.2,False,274.847726 +4e3a4215-049d-47d9-a8ac-a3632ab8024d,grok-code-fast-1,xai,extract-elf,3242,2127,5369,282.526449,True,1.0,grok-code-fast-1,extract-elf,282.526449,True,0.6,True,282.526449 +3e08f3b9-29d6-4997-bdd6-d714f8637602,grok-code-fast-1,xai,nginx-request-logging,3708,1975,5683,78.482906,False,0.0,grok-code-fast-1,nginx-request-logging,78.482906,False,0.0,False,78.482906 +591ef413-f093-4569-89b0-8f032a8d11fe,deepseek-ai/DeepSeek-V3.1,together_ai,cancel-async-tasks,2060,1160,3220,162.553326,True,1.0,deepseek-ai/DeepSeek-V3.1,cancel-async-tasks,162.553326,True,0.4,True,162.553326 +6bbed1dc-90b6-49e1-b51b-9421dd2357a7,gpt-5-nano,openai,pypi-server,3705,1910,5615,153.238482,True,1.0,gpt-5-nano,pypi-server,153.238482,True,0.8,True,153.238482 +1ee4effa-e62b-4eee-91f2-ddf6a6db9821,grok-4-0709,xai,vulnerable-secret,7337,4121,11458,900.19694,False,0.0,grok-4-0709,vulnerable-secret,900.19694,False,0.6,False,900.19694 +65498ab0-8c5a-440e-b1f9-a4ce470026d6,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,crack-7z-hash,3058,1658,4716,265.532981,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,crack-7z-hash,265.532981,False,0.0,False,265.532981 +88844d79-705c-4a91-b046-d139020d8ace,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,install-klee-minimal,14418,1807,16225,900.02768,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,install-klee-minimal,900.02768,False,0.0,False,900.02768 +689b6712-a73d-42e5-8dfb-45303790a1dd,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,nginx-request-logging,7220,4276,11496,1028.651128,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,nginx-request-logging,1028.651128,False,0.4,False,1028.651128 
+06f0e241-6d28-48e4-bd5f-f9b89cacceaf,deepseek-ai/DeepSeek-V3.1,together_ai,train-fasttext,11798,6250,18048,3246.338034,False,0.0,deepseek-ai/DeepSeek-V3.1,train-fasttext,3246.338034,False,0.0,False,3246.338034 +4998705f-dfc2-4d43-9bca-1d2b5bd7d83d,gemini-2.5-pro,gemini,crack-7z-hash,12846,3452,16298,327.452375,True,1.0,gemini-2.5-pro,crack-7z-hash,327.452375,True,0.8,True,327.452375 +d5039454-20af-4a8e-8045-2c85406377ca,claude-sonnet-4-20250514,anthropic,fix-ocaml-gc,24813,8403,33216,1277.170482,False,0.0,claude-sonnet-4-20250514,fix-ocaml-gc,1277.170482,False,0.0,False,1277.170482 +e9ffdf80-dcfa-4a1d-8d5e-6768219b907a,zai-org/GLM-4.5-Air-FP8,together_ai,form-filling,5662,5066,10728,309.418837,True,1.0,zai-org/GLM-4.5-Air-FP8,form-filling,309.418837,True,0.8,True,309.418837 +880441ee-3aec-43a7-baf3-293c25ad9eea,gpt-5-nano,openai,vulnerable-secret,9809,3899,13708,908.780874,False,0.0,gpt-5-nano,vulnerable-secret,908.780874,False,0.2,False,908.780874 +5b60c6ed-f72d-44e0-9f34-6841be37abb2,grok-4-0709,xai,polyglot-rust-c,0,0,0,926.205025,False,0.0,grok-4-0709,polyglot-rust-c,926.205025,False,0.0,False,926.205025 +af16970b-760f-4caf-aa56-b55320bc0afd,deepseek-ai/DeepSeek-V3.1,together_ai,feal-differential-cryptanalysis,9099,9287,18386,552.497041,False,0.0,deepseek-ai/DeepSeek-V3.1,feal-differential-cryptanalysis,552.497041,False,0.0,False,552.497041 +43f117d1-4663-4dd6-b0c4-79bd41ec21d1,deepseek-ai/DeepSeek-V3.1,together_ai,nginx-request-logging,6484,3842,10326,411.122519,False,0.0,deepseek-ai/DeepSeek-V3.1,nginx-request-logging,411.122519,False,0.4,False,411.122519 +ca358afb-ab6e-452c-8dd2-534056b29c16,zai-org/GLM-4.5-Air-FP8,together_ai,constraints-scheduling,5703,5672,11375,458.157091,True,1.0,zai-org/GLM-4.5-Air-FP8,constraints-scheduling,458.157091,True,0.8,True,458.157091 
+36866639-1694-4a12-8ef2-06869295a9e1,openai/gpt-oss-120b,together_ai,polyglot-rust-c,2621,6305,8926,928.696927,False,0.0,openai/gpt-oss-120b,polyglot-rust-c,928.696927,False,0.0,False,928.696927 +01ee34f8-ada5-4462-8793-233fe6f4a60e,claude-sonnet-4-20250514,anthropic,largest-eigenval,10919,9097,20016,903.644081,False,0.0,claude-sonnet-4-20250514,largest-eigenval,903.644081,False,0.0,False,903.644081 +524f0260-b55b-4443-ab46-42601de929cc,gemini-2.5-pro,gemini,qemu-alpine-ssh,1895,1746,3641,252.888384,False,0.0,gemini-2.5-pro,qemu-alpine-ssh,252.888384,False,0.2,False,252.888384 +478f169d-bf19-454b-9ef1-92823cfc118e,gpt-5,openai,build-pmars,9368,2583,11951,420.529629,True,1.0,gpt-5,build-pmars,420.529629,True,0.8,True,420.529629 +8afc75a0-d7fa-476a-8446-a550a85dfed3,OpenAI/gpt-oss-20B,together_ai,adaptive-rejection-sampler,1792,1857,3649,143.258045,False,0.0,OpenAI/gpt-oss-20B,adaptive-rejection-sampler,143.258045,False,0.0,False,143.258045 +f69277b5-c127-47d3-8c69-678d7011c3b3,gpt-5,openai,sanitize-git-repo,13890,5574,19464,687.354037,True,1.0,gpt-5,sanitize-git-repo,687.354037,True,0.2857142857142857,True,687.354037 +0a4ae6e3-6cce-4e26-ab2d-5287e007dc31,grok-code-fast-1,xai,run-pdp11-code,2167,1836,4003,778.566592,False,0.0,grok-code-fast-1,run-pdp11-code,778.566592,False,0.0,False,778.566592 +3d16d4f1-087b-4562-9a9f-4b1bdf96aa73,openai/gpt-oss-120b,together_ai,configure-git-webserver,1699,1375,3074,209.571504,False,0.0,openai/gpt-oss-120b,configure-git-webserver,209.571504,False,0.6,False,209.571504 +f382387a-f40c-4c84-a149-9b29cd49a982,gpt-5-nano,openai,largest-eigenval,4420,3549,7969,962.463437,False,0.0,gpt-5-nano,largest-eigenval,962.463437,False,0.0,False,962.463437 +67e5c801-6eae-491d-b3bb-74a6ed2e3114,gemini-2.5-pro,gemini,dna-insert,5057,1011,6068,364.122258,False,0.0,gemini-2.5-pro,dna-insert,364.122258,False,0.0,False,364.122258 
+e6bca75e-550b-4a78-ad5a-9753313964bc,grok-code-fast-1,xai,run-pdp11-code,2303,2305,4608,168.64466,False,0.0,grok-code-fast-1,run-pdp11-code,168.64466,False,0.0,False,168.64466 +a5ee2eba-2af4-44fe-9b12-69b3bce53268,gpt-5,openai,cobol-modernization,6141,5526,11667,426.111141,True,1.0,gpt-5,cobol-modernization,426.111141,True,1.0,True,426.111141 +07cbeece-e396-4b98-9ba3-fb3496789e57,claude-opus-4-1-20250805,anthropic,torch-tensor-parallelism,4882,3790,8672,147.162879,False,0.0,claude-opus-4-1-20250805,torch-tensor-parallelism,147.162879,False,0.0,False,147.162879 +7def81f5-d4e3-43d4-9ca2-d5e1f33541a8,gemini-2.5-pro,gemini,winning-avg-corewars,11625,15731,27356,1339.260448,False,0.0,gemini-2.5-pro,winning-avg-corewars,1339.260448,False,0.0,False,1339.260448 +00b0e268-080e-4a30-bb5f-921019fa3797,claude-sonnet-4-20250514,anthropic,path-tracing,5605,4534,10139,532.645955,False,0.0,claude-sonnet-4-20250514,path-tracing,532.645955,False,0.0,False,532.645955 +66d7d325-0c65-4beb-aec6-e109d97d67e9,claude-sonnet-4-20250514,anthropic,code-from-image,4874,4876,9750,347.249671,False,0.0,claude-sonnet-4-20250514,code-from-image,347.249671,False,0.2,False,347.249671 +c3775e21-dc38-4cbf-8093-c659a6ffca66,claude-opus-4-1-20250805,anthropic,configure-git-webserver,5559,1752,7311,125.583902,False,0.0,claude-opus-4-1-20250805,configure-git-webserver,125.583902,False,0.625,False,125.583902 +6ec28ab7-d65a-46e3-9029-5aefe40b8c44,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,run-pdp11-code,7332,6073,13405,1016.778645,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,run-pdp11-code,1016.778645,False,0.0,False,1016.778645 +76cecade-671c-4521-bd1c-28b05718238b,OpenAI/gpt-oss-20B,together_ai,largest-eigenval,376,2520,2896,165.682031,False,0.0,OpenAI/gpt-oss-20B,largest-eigenval,165.682031,False,0.0,False,165.682031 
+379e18f3-942a-4915-b113-42d444932bc7,gemini-2.5-pro,gemini,mteb-leaderboard,49814,19385,69199,3606.706124,False,0.0,gemini-2.5-pro,mteb-leaderboard,3606.706124,False,0.0,False,3606.706124 +fd1d2ad9-8e48-482a-bbf8-13e6ea132bb5,gemini-2.5-pro,gemini,log-summary-date-ranges,7320,1790,9110,114.233689,False,0.0,gemini-2.5-pro,log-summary-date-ranges,114.233689,False,0.0,False,114.233689 +ff8cb9a5-0d28-43d6-856f-30f8acede506,gpt-5-nano,openai,prove-plus-comm,3499,4296,7795,900.001055,False,0.0,gpt-5-nano,prove-plus-comm,900.001055,False,0.4,False,900.001055 +fab8b80d-b3df-45d6-a613-57241b5d125d,claude-sonnet-4-20250514,anthropic,model-extraction-relu-logits,12586,11045,23631,706.415487,False,0.0,claude-sonnet-4-20250514,model-extraction-relu-logits,706.415487,False,0.0,False,706.415487 +5dd26334-3994-44f9-8a89-2301ddbf7ef0,gpt-5-mini,openai,pytorch-model-cli,1656,1236,2892,91.107201,False,0.0,gpt-5-mini,pytorch-model-cli,91.107201,False,0.0,False,91.107201 +dc758f7d-3f57-4366-863d-254582068199,claude-opus-4-1-20250805,anthropic,build-cython-ext,22695,10051,32746,900.239924,False,0.0,claude-opus-4-1-20250805,build-cython-ext,900.239924,False,0.0,False,900.239924 +bfb9b1fc-26f4-42e1-b2d3-a49bbadf4b95,OpenAI/gpt-oss-20B,together_ai,gpt2-codegolf,2445,6754,9199,774.970246,False,0.0,OpenAI/gpt-oss-20B,gpt2-codegolf,774.970246,False,0.0,False,774.970246 +83f43bf6-9c3d-4b94-a868-e3bc947d5a29,OpenAI/gpt-oss-20B,together_ai,feal-linear-cryptanalysis,7379,36953,44332,1814.977613,False,0.0,OpenAI/gpt-oss-20B,feal-linear-cryptanalysis,1814.977613,False,0.0,False,1814.977613 +c8c4f4fd-d5d2-4a2f-bd20-4dd7fe3c1969,grok-code-fast-1,xai,mteb-retrieve,1921,842,2763,139.967001,False,0.0,grok-code-fast-1,mteb-retrieve,139.967001,False,0.0,False,139.967001 +8a1640df-dad4-4f97-9c51-a6f305b4f582,claude-opus-4-1-20250805,anthropic,gpt2-codegolf,10275,9715,19990,900.099502,False,0.0,claude-opus-4-1-20250805,gpt2-codegolf,900.099502,False,0.0,False,900.099502 
+1c15cc11-ba44-4d52-ad7e-a73a84f059e4,grok-4-0709,xai,filter-js-from-html,931,981,1912,319.098513,False,0.0,grok-4-0709,filter-js-from-html,319.098513,False,0.0,False,319.098513 +f4e2e17b-4463-468e-9b50-5b197465dd0b,claude-sonnet-4-20250514,anthropic,train-fasttext,58646,14064,72710,3606.13041,False,0.0,claude-sonnet-4-20250514,train-fasttext,3606.13041,False,0.0,False,3606.13041 +7ac18365-fbee-46f4-9c71-a026fe955df2,openai/gpt-oss-120b,together_ai,feal-differential-cryptanalysis,1657,1817,3474,247.940154,False,0.0,openai/gpt-oss-120b,feal-differential-cryptanalysis,247.940154,False,0.0,False,247.940154 +e929db16-6bfa-4b68-9b0e-1d59c45bfb71,claude-sonnet-4-20250514,anthropic,polyglot-c-py,2262,2237,4499,120.665617,False,0.0,claude-sonnet-4-20250514,polyglot-c-py,120.665617,False,0.0,False,120.665617 +555b77eb-5c3d-4a4e-b4c9-ea03b9be4b2c,gemini-2.5-flash,gemini,port-compressor,127033,120515,247548,3600.001834,False,0.0,gemini-2.5-flash,port-compressor,3600.001834,False,0.0,False,3600.001834 +1d4e99e1-3062-4b25-839a-18b3e1d9179c,claude-opus-4-1-20250805,anthropic,fix-ocaml-gc,34230,14752,48982,2020.377457,True,1.0,claude-opus-4-1-20250805,fix-ocaml-gc,2020.377457,True,0.5,True,2020.377457 +87463878-f622-4fa2-9a55-ee58363edc97,gemini-2.5-pro,gemini,filter-js-from-html,1452,874,2326,95.371836,False,0.0,gemini-2.5-pro,filter-js-from-html,95.371836,False,0.0,False,95.371836 +7a49235b-1b2f-484d-921b-9ea63dab8d0f,moonshotai/Kimi-K2-Instruct-0905,together_ai,reverse-engineering,10046,4351,14397,328.351121,True,1.0,moonshotai/Kimi-K2-Instruct-0905,reverse-engineering,328.351121,True,0.2,True,328.351121 +4a36f880-8c1c-4050-8338-d3f08073109e,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,video-processing,1858,3844,5702,208.550899,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,video-processing,208.550899,False,0.0,False,208.550899 
+05ff8ea1-61c4-4641-b55e-aa6c64e64095,gpt-5,openai,mteb-leaderboard,13472,8106,21578,1002.181577,False,0.0,gpt-5,mteb-leaderboard,1002.181577,False,0.0,False,1002.181577 +d9cdb001-d9ce-45ad-92ff-481a1abc6d54,moonshotai/Kimi-K2-Instruct-0905,together_ai,large-scale-text-editing,14751,7627,22378,1211.197888,False,0.0,moonshotai/Kimi-K2-Instruct-0905,large-scale-text-editing,1211.197888,False,0.0,False,1211.197888 +00a18e70-ca97-4d39-9498-a6abc8b5772d,grok-4-0709,xai,install-klee-minimal,7922,2186,10108,900.017379,False,0.0,grok-4-0709,install-klee-minimal,900.017379,False,0.0,False,900.017379 +83d46178-f3cb-416a-989b-674ac1c8c59b,claude-opus-4-1-20250805,anthropic,dna-insert,5771,3370,9141,366.177928,False,0.0,claude-opus-4-1-20250805,dna-insert,366.177928,False,0.0,False,366.177928 +9d500747-e08e-404b-98eb-9307a901745d,deepseek-ai/DeepSeek-V3.1,together_ai,fix-ocaml-gc,50510,22369,72879,2767.206252,False,0.0,deepseek-ai/DeepSeek-V3.1,fix-ocaml-gc,2767.206252,False,0.0,False,2767.206252 +e2cc6cfd-8a05-4d21-9a29-6101193986cb,grok-code-fast-1,xai,path-tracing-reverse,7612,7223,14835,778.868283,False,0.0,grok-code-fast-1,path-tracing-reverse,778.868283,False,0.0,False,778.868283 +3c480d88-4a55-44b1-af7d-46492ec5566e,gpt-5-nano,openai,git-leak-recovery,5360,5154,10514,458.77393,False,0.0,gpt-5-nano,git-leak-recovery,458.77393,False,0.0,False,458.77393 +5be71768-fa15-449d-b181-b3c3c0d61275,gemini-2.5-flash,gemini,torch-tensor-parallelism,2056,3391,5447,783.1688,False,0.0,gemini-2.5-flash,torch-tensor-parallelism,783.1688,False,0.0,False,783.1688 +1c72e7bd-15d9-4083-8d19-238f2b806d59,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,db-wal-recovery,6215,5815,12030,902.751639,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,db-wal-recovery,902.751639,False,0.0,False,902.751639 
+23e2626c-010b-43ca-b41a-105e2e9743ff,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-pov-ray,32342,9396,41738,4317.453263,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-pov-ray,4317.453263,False,0.0,False,4317.453263 +040d3028-6b17-46a6-bdf1-818da5f3bd01,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-pov-ray,19056,7282,26338,1043.830663,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-pov-ray,1043.830663,True,0.2,True,1043.830663 +97c0c036-f35b-43bd-ad4e-361e13d3adf3,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,mteb-retrieve,2979,2165,5144,223.729267,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,mteb-retrieve,223.729267,False,0.0,False,223.729267 +83043e4e-97ee-4b66-b7c2-c57d6042fef3,gpt-5-mini,openai,nginx-request-logging,4248,1949,6197,177.985975,False,0.0,gpt-5-mini,nginx-request-logging,177.985975,False,0.4,False,177.985975 +4c9bf875-99a7-412f-8550-8dd08811189a,grok-code-fast-1,xai,feal-differential-cryptanalysis,2445,1545,3990,263.713261,False,0.0,grok-code-fast-1,feal-differential-cryptanalysis,263.713261,False,0.0,False,263.713261 +b7256ad5-b158-4c4c-a710-7128603f531e,claude-sonnet-4-20250514,anthropic,nginx-request-logging,6537,4120,10657,254.527126,True,1.0,claude-sonnet-4-20250514,nginx-request-logging,254.527126,True,1.0,True,254.527126 +67f0de7a-25df-4e4b-8694-32235ee1275a,claude-sonnet-4-20250514,anthropic,polyglot-rust-c,9784,10504,20288,900.224497,False,0.0,claude-sonnet-4-20250514,polyglot-rust-c,900.224497,False,0.0,False,900.224497 +3b02795e-22c0-432b-90d8-703d409b8807,claude-opus-4-1-20250805,anthropic,fix-git,2809,1796,4605,215.462981,True,1.0,claude-opus-4-1-20250805,fix-git,215.462981,True,1.0,True,215.462981 +f02f5826-1638-4464-aa0e-4b7d551c05cd,claude-sonnet-4-20250514,anthropic,feal-differential-cryptanalysis,26383,26731,53114,1807.815899,False,0.0,claude-sonnet-4-20250514,feal-differential-cryptanalysis,1807.815899,False,0.0,False,1807.815899 
+50335ce8-c241-4552-932f-270ce3c2edf6,gpt-5-nano,openai,polyglot-c-py,4537,11183,15720,900.234927,False,0.0,gpt-5-nano,polyglot-c-py,900.234927,False,0.0,False,900.234927 +b92f316d-8c02-4050-81d2-fabf60ac837a,openai/gpt-oss-120b,together_ai,db-wal-recovery,4481,8773,13254,938.49404,False,0.0,openai/gpt-oss-120b,db-wal-recovery,938.49404,False,0.0,False,938.49404 +537ace88-a5c4-473b-a497-625221d892f1,openai/gpt-oss-120b,together_ai,build-pmars,8834,3298,12132,900.935693,False,0.0,openai/gpt-oss-120b,build-pmars,900.935693,False,0.2,False,900.935693 +970711a8-9e14-463e-b651-7362ca3795f9,zai-org/GLM-4.5-Air-FP8,together_ai,merge-diff-arc-agi-task,37239,26374,63613,809.795325,False,0.0,zai-org/GLM-4.5-Air-FP8,merge-diff-arc-agi-task,809.795325,False,0.0,False,809.795325 +b421b0f4-1d85-46bc-98c4-edacde5964b3,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,fix-code-vulnerability,17192,7218,24410,908.555324,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,fix-code-vulnerability,908.555324,True,0.4,True,908.555324 +86a8c7a3-349a-4c60-b6b8-b52d6632fb14,moonshotai/Kimi-K2-Instruct-0905,together_ai,prove-plus-comm,2226,1854,4080,89.970492,True,1.0,moonshotai/Kimi-K2-Instruct-0905,prove-plus-comm,89.970492,True,0.8,True,89.970492 +7a2bf2b9-3b4c-43ca-86df-76c3df820431,gpt-5,openai,build-cython-ext,7992,4962,12954,923.773514,False,0.0,gpt-5,build-cython-ext,923.773514,False,0.0,False,923.773514 +93dab8c0-ef8d-4c05-afc1-05172496bc0d,gpt-5-nano,openai,largest-eigenval,5246,7975,13221,900.132336,False,0.0,gpt-5-nano,largest-eigenval,900.132336,False,0.0,False,900.132336 +afa1fbae-92d2-4a9a-9ed0-1ab236009e69,OpenAI/gpt-oss-20B,together_ai,regex-log,453,862,1315,48.893916,False,0.0,OpenAI/gpt-oss-20B,regex-log,48.893916,False,0.0,False,48.893916 +5729b407-921a-484f-b68e-3b562602a700,gemini-2.5-flash,gemini,prove-plus-comm,1861,2115,3976,90.077706,True,1.0,gemini-2.5-flash,prove-plus-comm,90.077706,True,0.6,True,90.077706 
+291a8432-894a-4774-9239-1add40c4f689,deepseek-ai/DeepSeek-V3.1,together_ai,wasm-pipeline,2625,2777,5402,1025.70974,False,0.0,deepseek-ai/DeepSeek-V3.1,wasm-pipeline,1025.70974,False,0.4,False,1025.70974 +f0a06e59-3ed2-46db-a1c1-f4ea6e1ddd4f,zai-org/GLM-4.5-Air-FP8,together_ai,torch-tensor-parallelism,12952,4131,17083,904.424344,False,0.0,zai-org/GLM-4.5-Air-FP8,torch-tensor-parallelism,904.424344,False,0.0,False,904.424344 +0d6e0e62-c526-4ab5-aea5-c940724e5ed5,gpt-5-nano,openai,dna-assembly,7823,10219,18042,763.386427,False,0.0,gpt-5-nano,dna-assembly,763.386427,False,0.0,False,763.386427 +7c8dd4b4-aab5-4f7d-bf94-573bb0883b57,gemini-2.5-flash,gemini,video-processing,3916,3312,7228,211.800366,False,0.0,gemini-2.5-flash,video-processing,211.800366,False,0.0,False,211.800366 +c6bca54f-5b6e-407e-99d7-4cba2a003fdb,claude-opus-4-1-20250805,anthropic,sqlite-db-truncate,10000,5580,15580,176.837932,False,0.0,claude-opus-4-1-20250805,sqlite-db-truncate,176.837932,False,0.125,False,176.837932 +3dae731a-d189-4f14-bfa5-c1efb7d0d997,OpenAI/gpt-oss-20B,together_ai,feal-differential-cryptanalysis,1382,2050,3432,231.52774,False,0.0,OpenAI/gpt-oss-20B,feal-differential-cryptanalysis,231.52774,False,0.0,False,231.52774 +d3b1b785-6b03-48cb-a2d0-ebe693ff184c,grok-code-fast-1,xai,make-mips-interpreter,6642,6771,13413,508.010753,False,0.0,grok-code-fast-1,make-mips-interpreter,508.010753,False,0.0,False,508.010753 +a65d8adf-242f-44c0-ab05-37be5a37fc1f,claude-opus-4-1-20250805,anthropic,prove-plus-comm,1618,1288,2906,117.069819,True,1.0,claude-opus-4-1-20250805,prove-plus-comm,117.069819,True,1.0,True,117.069819 +933b3917-9a41-4b0d-8531-179c63a40e51,openai/gpt-oss-120b,together_ai,make-doom-for-mips,9168,4158,13326,900.576974,False,0.0,openai/gpt-oss-120b,make-doom-for-mips,900.576974,False,0.0,False,900.576974 
+23485f97-ff71-42ec-a1f9-1efda9e5d771,OpenAI/gpt-oss-20B,together_ai,db-wal-recovery,1082,2233,3315,106.632391,False,0.0,OpenAI/gpt-oss-20B,db-wal-recovery,106.632391,False,0.0,False,106.632391 +43ea0245-e4c0-41a9-a3d2-91200c59460c,zai-org/GLM-4.5-Air-FP8,together_ai,torch-tensor-parallelism,2540,2475,5015,254.077497,False,0.0,zai-org/GLM-4.5-Air-FP8,torch-tensor-parallelism,254.077497,False,0.0,False,254.077497 +62e34087-ec30-47b3-a681-485b37ba4a35,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,count-dataset-tokens,7189,1904,9093,180.450189,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,count-dataset-tokens,180.450189,False,0.0,False,180.450189 +956f5e49-1099-4023-8aab-2b12bcf0a7d6,gpt-5,openai,distribution-search,3062,4090,7152,272.605554,True,1.0,gpt-5,distribution-search,272.605554,True,1.0,True,272.605554 +6e41832a-5685-48bb-abaf-6c677ff659a6,grok-code-fast-1,xai,pytorch-model-cli,2796,1217,4013,195.916782,False,0.0,grok-code-fast-1,pytorch-model-cli,195.916782,False,0.0,False,195.916782 +1766329d-0965-4567-931c-021b7ff46521,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,dna-assembly,3559,3161,6720,508.706495,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,dna-assembly,508.706495,False,0.0,False,508.706495 +13f66ada-763e-4105-bf66-b3e4bb97a38e,moonshotai/Kimi-K2-Instruct-0905,together_ai,largest-eigenval,4766,2777,7543,916.13923,False,0.0,moonshotai/Kimi-K2-Instruct-0905,largest-eigenval,916.13923,False,0.2,False,916.13923 +0a48e58a-60e1-427d-8751-98eae75a539d,gemini-2.5-flash,gemini,gpt2-codegolf,2025,3242,5267,386.891306,False,0.0,gemini-2.5-flash,gpt2-codegolf,386.891306,False,0.0,False,386.891306 +7aeec8db-253e-45cd-bfb6-7ec00db319cc,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,reverse-engineering,8560,4211,12771,702.84289,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,reverse-engineering,702.84289,False,0.0,False,702.84289 
+d1a11941-1001-450e-a4d7-8255463153e1,grok-4-0709,xai,regex-log,1337,632,1969,326.288649,True,1.0,grok-4-0709,regex-log,326.288649,True,0.6,True,326.288649 +d99c5e9b-5ae4-4eb9-a4ca-85bbb5a843ed,gemini-2.5-flash,gemini,install-klee-minimal,17875,3890,21765,900.076384,False,0.0,gemini-2.5-flash,install-klee-minimal,900.076384,False,0.0,False,900.076384 +101724e9-43a8-4fd2-ac39-fa24325ebfe8,openai/gpt-oss-120b,together_ai,reshard-c4-data,12464,6440,18904,904.945609,False,0.0,openai/gpt-oss-120b,reshard-c4-data,904.945609,False,0.0,False,904.945609 +fa8b227a-424d-4e14-bcb3-322b741600ad,gpt-5-mini,openai,dna-assembly,11849,8974,20823,720.074785,False,0.0,gpt-5-mini,dna-assembly,720.074785,False,0.0,False,720.074785 +79c5c17d-a4e3-4af1-84f5-e1c8f19d6005,claude-opus-4-1-20250805,anthropic,git-leak-recovery,2927,1926,4853,135.387313,True,1.0,claude-opus-4-1-20250805,git-leak-recovery,135.387313,True,1.0,True,135.387313 +793c9421-dbf2-43ec-b371-98c8abf8e397,OpenAI/gpt-oss-20B,together_ai,financial-document-processor,888,1006,1894,45.209994,False,0.0,OpenAI/gpt-oss-20B,financial-document-processor,45.209994,False,0.0,False,45.209994 +ab2fd17a-7de8-4a23-88ad-9f91a509c143,OpenAI/gpt-oss-20B,together_ai,model-extraction-relu-logits,472,576,1048,224.200182,False,0.0,OpenAI/gpt-oss-20B,model-extraction-relu-logits,224.200182,False,0.0,False,224.200182 +ec41e45d-2ebc-4705-b687-3d358466633d,gpt-5,openai,extract-elf,2347,2418,4765,189.579897,True,1.0,gpt-5,extract-elf,189.579897,True,0.2857142857142857,True,189.579897 +a61f3994-527d-4adb-8aca-fc1eb3c11d24,OpenAI/gpt-oss-20B,together_ai,git-leak-recovery,1219,494,1713,29.240326,False,0.0,OpenAI/gpt-oss-20B,git-leak-recovery,29.240326,False,0.0,False,29.240326 +5a31e89e-d186-4eb6-9291-b334cd3a80a5,claude-sonnet-4-20250514,anthropic,pytorch-model-cli,5306,6210,11516,546.13274,False,0.0,claude-sonnet-4-20250514,pytorch-model-cli,546.13274,False,0.4,False,546.13274 
+a3c97c9e-32d1-4d8c-9528-d2cea743ca93,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,video-processing,3566,2969,6535,82.390943,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,video-processing,82.390943,False,0.0,False,82.390943 +0fde5abe-52f2-40d9-ab14-cf9c19ae97e1,gpt-5-nano,openai,bn-fit-modify,8452,8119,16571,542.463067,False,0.0,gpt-5-nano,bn-fit-modify,542.463067,False,0.0,False,542.463067 +4424ef95-e7a5-4ef2-8bfd-a277a0257087,grok-4-0709,xai,build-pmars,13749,4805,18554,818.704025,False,0.0,grok-4-0709,build-pmars,818.704025,False,0.2,False,818.704025 +e56e2182-7af5-4dde-8cad-0c555badbfcd,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,pytorch-model-cli,7873,1422,9295,134.009373,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,pytorch-model-cli,134.009373,False,0.0,False,134.009373 +404fa14c-bdc6-4a87-9fcf-46b988f4ced9,moonshotai/Kimi-K2-Instruct-0905,together_ai,cobol-modernization,3418,3430,6848,919.764676,True,1.0,moonshotai/Kimi-K2-Instruct-0905,cobol-modernization,919.764676,True,0.6,True,919.764676 +82206198-4a21-4b5c-a190-7b53c7efdd9b,zai-org/GLM-4.5-Air-FP8,together_ai,break-filter-js-from-html,6875,8015,14890,424.310438,False,0.0,zai-org/GLM-4.5-Air-FP8,break-filter-js-from-html,424.310438,False,0.0,False,424.310438 +b01012d5-9bbb-4f15-a205-39120ca6a1d7,grok-4-0709,xai,pytorch-model-cli,11852,4340,16192,795.579642,True,1.0,grok-4-0709,pytorch-model-cli,795.579642,True,0.6,True,795.579642 +9c70a4c1-925e-43f4-8057-2fa47fcddf75,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sqlite-db-truncate,8007,2244,10251,277.26134,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sqlite-db-truncate,277.26134,False,0.0,False,277.26134 +c83a3078-238e-480c-bb8c-564027231f39,zai-org/GLM-4.5-Air-FP8,together_ai,schemelike-metacircular-eval,43718,39294,83012,2412.515906,False,0.0,zai-org/GLM-4.5-Air-FP8,schemelike-metacircular-eval,2412.515906,False,0.0,False,2412.515906 
+5cc908a0-b8b0-4596-883e-30344ce209a9,grok-code-fast-1,xai,financial-document-processor,7751,2567,10318,328.287738,False,0.0,grok-code-fast-1,financial-document-processor,328.287738,False,0.0,False,328.287738 +2be63c7d-cac6-46a2-82cc-a5a745dc700c,gpt-5-nano,openai,build-pov-ray,18395,59805,78200,6000.001924,False,0.0,gpt-5-nano,build-pov-ray,6000.001924,False,0.0,False,6000.001924 +e6b5cecc-812d-43ed-a808-f36276f54b3e,OpenAI/gpt-oss-20B,together_ai,chess-best-move,453,603,1056,91.240332,False,0.0,OpenAI/gpt-oss-20B,chess-best-move,91.240332,False,0.0,False,91.240332 +b95070cc-959e-4171-b2a5-328186e6d775,gemini-2.5-flash,gemini,model-extraction-relu-logits,2175,2840,5015,202.07906,False,0.0,gemini-2.5-flash,model-extraction-relu-logits,202.07906,False,0.2,False,202.07906 +fa540284-c635-43d8-8eb0-e7e180023adc,gpt-5-mini,openai,pytorch-model-recovery,11718,11289,23007,809.873501,False,0.0,gpt-5-mini,pytorch-model-recovery,809.873501,False,0.0,False,809.873501 +c41afec4-6ea4-42fa-b4df-75657ceb36f4,moonshotai/Kimi-K2-Instruct-0905,together_ai,cancel-async-tasks,2586,2093,4679,131.481846,True,1.0,moonshotai/Kimi-K2-Instruct-0905,cancel-async-tasks,131.481846,True,0.6,True,131.481846 +63c9e862-a49c-4e58-b91c-411f2b72b19f,openai/gpt-oss-120b,together_ai,qemu-alpine-ssh,1461,1287,2748,323.99536,False,0.0,openai/gpt-oss-120b,qemu-alpine-ssh,323.99536,False,0.0,False,323.99536 +5db0491c-697e-405f-9164-a1258d139e01,openai/gpt-oss-120b,together_ai,model-extraction-relu-logits,1705,802,2507,298.438904,False,0.0,openai/gpt-oss-120b,model-extraction-relu-logits,298.438904,False,0.0,False,298.438904 +0e0a518a-f4e3-4459-be23-003886ce1e09,claude-opus-4-1-20250805,anthropic,password-recovery,6684,4886,11570,902.500883,True,1.0,claude-opus-4-1-20250805,password-recovery,902.500883,True,0.5555555555555556,True,902.500883 
+04ac7774-e89b-4375-951c-ec9170f30284,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,qemu-alpine-ssh,1312,1047,2359,106.73237,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,qemu-alpine-ssh,106.73237,False,0.0,False,106.73237 +235801ab-a88a-4838-8e2d-d04988be3556,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,reverse-engineering,6253,3499,9752,230.139471,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,reverse-engineering,230.139471,False,0.0,False,230.139471 +3659ca32-7816-423d-94ea-787521afc68b,openai/gpt-oss-120b,together_ai,qemu-startup,1204,974,2178,46.33987,False,0.0,openai/gpt-oss-120b,qemu-startup,46.33987,False,0.0,False,46.33987 +d3180dfd-7a50-456c-bba9-b4a5cdbf8dca,gpt-5-nano,openai,extract-elf,10891,5297,16188,562.913072,False,0.0,gpt-5-nano,extract-elf,562.913072,False,0.2,False,562.913072 +d7e84b9c-fb8d-4bd9-8792-5ba94104bba4,grok-code-fast-1,xai,install-klee-minimal,6106,1709,7815,908.998116,False,0.0,grok-code-fast-1,install-klee-minimal,908.998116,False,0.0,False,908.998116 +0af69304-388b-4d13-9bb5-5c4c68dc7e7a,gpt-5-nano,openai,pytorch-model-cli,2564,3147,5711,268.352405,False,0.0,gpt-5-nano,pytorch-model-cli,268.352405,False,0.0,False,268.352405 +5a891410-2c6b-4a56-9686-78ff09d5baf3,gpt-5-mini,openai,train-fasttext,16818,15772,32590,3627.221369,False,0.0,gpt-5-mini,train-fasttext,3627.221369,False,0.0,False,3627.221369 +1f869daf-56d3-4393-8e53-c986c3d92a13,grok-code-fast-1,xai,dna-insert,7749,2080,9829,170.686827,False,0.0,grok-code-fast-1,dna-insert,170.686827,False,0.0,False,170.686827 +737b8cc3-5e2e-468a-a50d-a22ee642b7fc,moonshotai/Kimi-K2-Instruct-0905,together_ai,qemu-startup,1536,1583,3119,146.083293,True,1.0,moonshotai/Kimi-K2-Instruct-0905,qemu-startup,146.083293,True,0.4,True,146.083293 +221a7e3b-c57c-44b1-b91d-04ee856cd993,grok-4-0709,xai,filter-js-from-html,1094,584,1678,527.277799,False,0.0,grok-4-0709,filter-js-from-html,527.277799,False,0.0,False,527.277799 
+a5bc764c-9b04-4ed7-bc2b-81d75b416966,OpenAI/gpt-oss-20B,together_ai,largest-eigenval,374,231,605,30.447841,False,0.0,OpenAI/gpt-oss-20B,largest-eigenval,30.447841,False,0.0,False,30.447841 +b6f91ed2-0f3d-426b-b2be-5913bcc21bb9,gpt-5-nano,openai,reverse-engineering,6184,7124,13308,1830.366763,False,0.0,gpt-5-nano,reverse-engineering,1830.366763,False,0.0,False,1830.366763 +c5319641-bdc5-4564-9cdf-45f510944655,gemini-2.5-flash,gemini,adaptive-rejection-sampler,11129,23159,34288,900.559728,False,0.0,gemini-2.5-flash,adaptive-rejection-sampler,900.559728,False,0.0,False,900.559728 +80f610d8-bf0d-400c-9585-8efee8808abc,openai/gpt-oss-120b,together_ai,crack-7z-hash,1223,748,1971,152.699364,False,0.0,openai/gpt-oss-120b,crack-7z-hash,152.699364,False,0.0,False,152.699364 +b14da1d4-649f-4ba6-a2b1-72aaeb523af0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sqlite-db-truncate,5682,4399,10081,459.544682,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sqlite-db-truncate,459.544682,False,0.0,False,459.544682 +a30b4630-c39e-4ad7-91a9-29e0810e4b08,moonshotai/Kimi-K2-Instruct-0905,together_ai,vulnerable-secret,2320,2919,5239,907.945944,False,0.0,moonshotai/Kimi-K2-Instruct-0905,vulnerable-secret,907.945944,False,0.2,False,907.945944 +d9f7fabe-ee30-4f99-ad6f-6cb263593be2,gemini-2.5-flash,gemini,regex-log,1349,785,2134,59.872783,True,1.0,gemini-2.5-flash,regex-log,59.872783,True,0.8,True,59.872783 +18da6fcd-bb39-44cb-931a-ce6c65725fc8,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,fix-ocaml-gc,32968,28608,61576,3613.109713,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,fix-ocaml-gc,3613.109713,False,0.0,False,3613.109713 +26c91249-e0b4-4f73-83fa-ad08aad206d0,zai-org/GLM-4.5-Air-FP8,together_ai,log-summary-date-ranges,7248,2339,9587,81.057681,True,1.0,zai-org/GLM-4.5-Air-FP8,log-summary-date-ranges,81.057681,True,0.8,True,81.057681 
+438fdb9a-f5fd-4e7a-937d-0dddb51d9a7f,moonshotai/Kimi-K2-Instruct-0905,together_ai,reverse-engineering,10405,5265,15670,2550.101008,False,0.0,moonshotai/Kimi-K2-Instruct-0905,reverse-engineering,2550.101008,False,0.2,False,2550.101008 +11bc9253-3243-4013-8211-37f5bb2ea246,openai/gpt-oss-120b,together_ai,make-doom-for-mips,18757,6318,25075,902.678084,False,0.0,openai/gpt-oss-120b,make-doom-for-mips,902.678084,False,0.0,False,902.678084 +9f4d21d1-32f3-4b7d-9aa2-6cfff96c74c8,gpt-5-mini,openai,run-pdp11-code,5829,3550,9379,693.143545,False,0.0,gpt-5-mini,run-pdp11-code,693.143545,False,0.0,False,693.143545 +8985e1bf-01b5-43f4-a9ab-e94ffcd5aa35,openai/gpt-oss-120b,together_ai,merge-diff-arc-agi-task,6432,3608,10040,206.437032,False,0.0,openai/gpt-oss-120b,merge-diff-arc-agi-task,206.437032,False,0.0,False,206.437032 +cde3bd3f-dda3-4702-a08a-4262816d2115,grok-code-fast-1,xai,build-pov-ray,14654,5733,20387,2396.423036,False,0.0,grok-code-fast-1,build-pov-ray,2396.423036,False,0.2,False,2396.423036 +51b82477-b3b9-4992-8b98-e28c1600dc68,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,torch-tensor-parallelism,3373,2437,5810,294.167971,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,torch-tensor-parallelism,294.167971,False,0.0,False,294.167971 +2eaca569-3442-4e32-a371-93c7e9f40804,grok-4-0709,xai,path-tracing,12345,4263,16608,1802.646409,False,0.0,grok-4-0709,path-tracing,1802.646409,False,0.0,False,1802.646409 +1284a529-edbb-4347-bd59-bd5493da2c4a,claude-opus-4-1-20250805,anthropic,adaptive-rejection-sampler,9967,3368,13335,2121.535579,False,0.0,claude-opus-4-1-20250805,adaptive-rejection-sampler,2121.535579,False,0.125,False,2121.535579 +e9da34a1-f7d9-4227-815d-fe46b4e225f2,gpt-5,openai,wasm-pipeline,8257,9642,17899,797.098302,True,1.0,gpt-5,wasm-pipeline,797.098302,True,1.0,True,797.098302 
+37a74b29-e7a4-400b-a188-aace78c0d409,moonshotai/Kimi-K2-Instruct-0905,together_ai,path-tracing-reverse,6395,7040,13435,588.36258,False,0.0,moonshotai/Kimi-K2-Instruct-0905,path-tracing-reverse,588.36258,False,0.0,False,588.36258 +1bb86b23-70b7-4ded-92b8-42089a80a6c2,gpt-5,openai,fix-code-vulnerability,8442,6960,15402,902.000882,False,0.0,gpt-5,fix-code-vulnerability,902.000882,False,0.0,False,902.000882 +010be9ab-f73d-4825-a6c3-20de731068c2,zai-org/GLM-4.5-Air-FP8,together_ai,break-filter-js-from-html,2444,2484,4928,166.897669,False,0.0,zai-org/GLM-4.5-Air-FP8,break-filter-js-from-html,166.897669,False,0.0,False,166.897669 +92461c80-eb60-482c-bb55-2bcc11051e5d,gpt-5,openai,gpt2-codegolf,3409,4838,8247,900.014797,False,0.0,gpt-5,gpt2-codegolf,900.014797,False,0.0,False,900.014797 +40b7f302-ba98-4531-9163-ea1f4de8db7f,OpenAI/gpt-oss-20B,together_ai,cobol-modernization,9875,17785,27660,914.721612,False,0.0,OpenAI/gpt-oss-20B,cobol-modernization,914.721612,False,0.0,False,914.721612 +b8900719-c08f-4987-a32b-10fdf84a0d7a,claude-opus-4-1-20250805,anthropic,polyglot-rust-c,8080,9358,17438,900.000976,False,0.0,claude-opus-4-1-20250805,polyglot-rust-c,900.000976,False,0.0,False,900.000976 +814a9719-ebd2-4a59-8318-b0403b0fbf2c,grok-code-fast-1,xai,vulnerable-secret,6414,3032,9446,188.613616,True,1.0,grok-code-fast-1,vulnerable-secret,188.613616,True,0.6,True,188.613616 +56c6266f-c920-4be4-9ef4-4f59c5c66f0f,claude-sonnet-4-20250514,anthropic,distribution-search,16100,14075,30175,1126.075232,False,0.0,claude-sonnet-4-20250514,distribution-search,1126.075232,False,0.6,False,1126.075232 +17da5b2b-eb9f-487b-b725-fe379680d6b1,grok-code-fast-1,xai,fix-code-vulnerability,7796,1935,9731,165.510629,False,0.0,grok-code-fast-1,fix-code-vulnerability,165.510629,False,0.0,False,165.510629 +15e42ae0-356b-4c05-a50d-28cbc6ae135f,grok-code-fast-1,xai,sqlite-db-truncate,12080,7057,19137,481.14695,False,0.0,grok-code-fast-1,sqlite-db-truncate,481.14695,False,0.0,False,481.14695 
+0d7ff63f-b5ab-4cf2-8ec4-0848282919cf,claude-sonnet-4-20250514,anthropic,large-scale-text-editing,4097,3465,7562,483.641946,True,1.0,claude-sonnet-4-20250514,large-scale-text-editing,483.641946,True,0.6,True,483.641946 +2c36bc67-529e-4625-8780-881b2996ac0b,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,path-tracing-reverse,15001,9969,24970,1077.740802,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,path-tracing-reverse,1077.740802,False,0.0,False,1077.740802 +a03d1eb8-1ef8-4993-beda-0d1aa75a858d,grok-code-fast-1,xai,build-pov-ray,15874,8814,24688,1235.74473,True,1.0,grok-code-fast-1,build-pov-ray,1235.74473,True,0.2,True,1235.74473 +ae0878f6-36f5-4c1a-8f5d-6a9c723bee52,gemini-2.5-pro,gemini,run-pdp11-code,6836,2332,9168,1123.358238,False,0.0,gemini-2.5-pro,run-pdp11-code,1123.358238,False,0.0,False,1123.358238 +f8d2d477-e5eb-49df-a9e8-69ffa83b56da,grok-4-0709,xai,fix-code-vulnerability,4973,3356,8329,900.000633,False,0.0,grok-4-0709,fix-code-vulnerability,900.000633,False,0.2,False,900.000633 +fe1ac5d2-7cbe-4703-8fd2-c437d053b0b9,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,schemelike-metacircular-eval,18845,21868,40713,1588.052894,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,schemelike-metacircular-eval,1588.052894,False,0.0,False,1588.052894 +289122a3-a0f6-4e6c-a79e-b5606784f55c,gpt-5-nano,openai,extract-elf,25763,10863,36626,900.607172,False,0.0,gpt-5-nano,extract-elf,900.607172,False,0.2,False,900.607172 +ce366a9d-36b9-4ad0-af44-038e7394fdf5,zai-org/GLM-4.5-Air-FP8,together_ai,cancel-async-tasks,1429,920,2349,27.84011,True,1.0,zai-org/GLM-4.5-Air-FP8,cancel-async-tasks,27.84011,True,0.2,True,27.84011 +0b4a8c07-7eaf-4b86-9b48-4f89a88128a3,openai/gpt-oss-120b,together_ai,pytorch-model-cli,1281,1423,2704,29.613396,False,0.0,openai/gpt-oss-120b,pytorch-model-cli,29.613396,False,0.0,False,29.613396 
+6c916892-6d20-4cd3-b501-7c8f1d1f74aa,gpt-5-mini,openai,extract-elf,2198,1832,4030,155.241286,True,1.0,gpt-5-mini,extract-elf,155.241286,True,0.6,True,155.241286 +0629b921-5023-48da-9581-c09e07980824,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,make-mips-interpreter,27469,13411,40880,1839.633245,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,make-mips-interpreter,1839.633245,False,0.0,False,1839.633245 +81369027-9010-458b-af5b-d5ac49bcb60d,moonshotai/Kimi-K2-Instruct-0905,together_ai,pytorch-model-recovery,15286,9985,25271,912.948684,True,1.0,moonshotai/Kimi-K2-Instruct-0905,pytorch-model-recovery,912.948684,True,0.4,True,912.948684 +d75bb81f-7dd7-4569-b344-14baa7831d09,claude-sonnet-4-20250514,anthropic,make-doom-for-mips,26524,7134,33658,901.964344,False,0.0,claude-sonnet-4-20250514,make-doom-for-mips,901.964344,False,0.0,False,901.964344 +0a61f64c-9b82-48ab-b4c9-17faab102bca,gemini-2.5-pro,gemini,pypi-server,7038,3268,10306,382.741979,False,0.0,gemini-2.5-pro,pypi-server,382.741979,False,0.8,False,382.741979 +b5e1b4c6-a8a3-4df9-8281-0b7b984fd07e,claude-sonnet-4-20250514,anthropic,build-pov-ray,18271,6692,24963,828.924243,True,1.0,claude-sonnet-4-20250514,build-pov-ray,828.924243,True,0.6,True,828.924243 +c1f3113e-4637-4c39-9267-d96e952c3130,claude-opus-4-1-20250805,anthropic,sqlite-db-truncate,6003,3825,9828,202.628815,False,0.0,claude-opus-4-1-20250805,sqlite-db-truncate,202.628815,False,0.125,False,202.628815 +9ce965b7-512c-447e-bd03-c41ac2746f4b,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sanitize-git-repo,2935,1424,4359,436.979807,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sanitize-git-repo,436.979807,False,0.0,False,436.979807 +e9898836-4c94-4f10-a6d6-6153b9926f9e,deepseek-ai/DeepSeek-V3.1,together_ai,build-initramfs-qemu,10232,4632,14864,906.348501,False,0.0,deepseek-ai/DeepSeek-V3.1,build-initramfs-qemu,906.348501,False,0.0,False,906.348501 
+836af897-cac7-46e5-8e3d-493af2a2cfd2,moonshotai/Kimi-K2-Instruct-0905,together_ai,make-doom-for-mips,8816,1301,10117,1002.425557,False,0.0,moonshotai/Kimi-K2-Instruct-0905,make-doom-for-mips,1002.425557,False,0.0,False,1002.425557 +0db97972-77d7-4a28-86e6-8e25753e54ba,grok-code-fast-1,xai,sqlite-db-truncate,5956,4326,10282,700.449719,False,0.0,grok-code-fast-1,sqlite-db-truncate,700.449719,False,0.0,False,700.449719 +d48352a3-f11c-4fac-aee8-9443adb8a733,claude-opus-4-1-20250805,anthropic,cobol-modernization,6567,3798,10365,315.53184,True,1.0,claude-opus-4-1-20250805,cobol-modernization,315.53184,True,0.875,True,315.53184 +e8bd4d79-ab27-433a-9e3b-ec2eee0b6c43,deepseek-ai/DeepSeek-V3.1,together_ai,winning-avg-corewars,9711,8513,18224,580.508966,False,0.0,deepseek-ai/DeepSeek-V3.1,winning-avg-corewars,580.508966,False,0.0,False,580.508966 +6a84c62e-9b51-471b-800c-aabca5c0e2e4,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-pov-ray,8199,2674,10873,388.846578,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-pov-ray,388.846578,False,0.0,False,388.846578 +ab3bf2da-d401-4778-893e-6187b4f73086,openai/gpt-oss-120b,together_ai,write-compressor,1987,1680,3667,200.664599,False,0.0,openai/gpt-oss-120b,write-compressor,200.664599,False,0.0,False,200.664599 +99769767-447e-456d-a1a3-54952767b535,gpt-5-nano,openai,cobol-modernization,8249,5982,14231,902.784781,False,0.0,gpt-5-nano,cobol-modernization,902.784781,False,0.4,False,902.784781 +88a9cd3e-5be0-4bcb-8324-dd7580bf5a62,grok-4-0709,xai,make-mips-interpreter,16481,12609,29090,1803.162384,False,0.0,grok-4-0709,make-mips-interpreter,1803.162384,False,0.0,False,1803.162384 +860bd125-e82a-455d-a4f2-66778adfde77,deepseek-ai/DeepSeek-V3.1,together_ai,build-pov-ray,12010,17202,29212,2107.552499,False,0.0,deepseek-ai/DeepSeek-V3.1,build-pov-ray,2107.552499,False,0.4,False,2107.552499 
+a15ad217-6647-4260-8cb8-0f49bf2ad5f3,zai-org/GLM-4.5-Air-FP8,together_ai,password-recovery,3591,10633,14224,761.301874,False,0.0,zai-org/GLM-4.5-Air-FP8,password-recovery,761.301874,False,0.0,False,761.301874 +82d01940-7c56-4554-aa39-595ae80879a5,OpenAI/gpt-oss-20B,together_ai,gpt2-codegolf,2386,9757,12143,910.717093,False,0.0,OpenAI/gpt-oss-20B,gpt2-codegolf,910.717093,False,0.0,False,910.717093 +19d933d3-b866-478f-aef3-141ad7f526bf,OpenAI/gpt-oss-20B,together_ai,regex-log,331,815,1146,152.851665,False,0.0,OpenAI/gpt-oss-20B,regex-log,152.851665,False,0.0,False,152.851665 +2fb59493-02c3-4696-a2ec-50353ae36f25,deepseek-ai/DeepSeek-V3.1,together_ai,circuit-fibsqrt,17295,17100,34395,3622.24772,False,0.0,deepseek-ai/DeepSeek-V3.1,circuit-fibsqrt,3622.24772,False,0.0,False,3622.24772 +09868f26-ef68-4ba2-92c2-2b4624a6902f,OpenAI/gpt-oss-20B,together_ai,dna-insert,2538,8553,11091,366.914253,False,0.0,OpenAI/gpt-oss-20B,dna-insert,366.914253,False,0.0,False,366.914253 +17ea7461-db60-4a35-ba2f-794a9f8f472f,moonshotai/Kimi-K2-Instruct-0905,together_ai,feal-linear-cryptanalysis,18689,18230,36919,1819.80891,False,0.0,moonshotai/Kimi-K2-Instruct-0905,feal-linear-cryptanalysis,1819.80891,False,0.0,False,1819.80891 +3ae214fb-fee1-4a31-a18a-4933c307580d,moonshotai/Kimi-K2-Instruct-0905,together_ai,large-scale-text-editing,5362,4915,10277,1221.816872,False,0.0,moonshotai/Kimi-K2-Instruct-0905,large-scale-text-editing,1221.816872,False,0.0,False,1221.816872 +26bf9181-ac63-4d87-b8bf-acecea5eb090,gpt-5,openai,mteb-retrieve,1907,887,2794,315.698627,False,0.0,gpt-5,mteb-retrieve,315.698627,False,0.0,False,315.698627 +46a8f4a6-707e-46f4-b891-cbaadebe0613,OpenAI/gpt-oss-20B,together_ai,password-recovery,580,1546,2126,408.20545,False,0.0,OpenAI/gpt-oss-20B,password-recovery,408.20545,False,0.0,False,408.20545 
+127905a6-5f28-4f57-b60c-99a8363c42f5,moonshotai/Kimi-K2-Instruct-0905,together_ai,run-pdp11-code,5856,4342,10198,1004.523248,False,0.0,moonshotai/Kimi-K2-Instruct-0905,run-pdp11-code,1004.523248,False,0.0,False,1004.523248 +aec7d125-de2a-4b3b-926f-7e168a8c803c,claude-opus-4-1-20250805,anthropic,largest-eigenval,17091,13149,30240,949.746904,False,0.0,claude-opus-4-1-20250805,largest-eigenval,949.746904,False,0.25,False,949.746904 +69c34280-4a18-4f7d-996f-adaf65ee29ba,claude-sonnet-4-20250514,anthropic,distribution-search,20358,17245,37603,1073.153483,False,0.0,claude-sonnet-4-20250514,distribution-search,1073.153483,False,0.6,False,1073.153483 +e8f24a2b-32b5-4992-82ed-07ed48d2fa10,grok-code-fast-1,xai,dna-assembly,6034,1547,7581,120.414696,False,0.0,grok-code-fast-1,dna-assembly,120.414696,False,0.0,False,120.414696 +3e3d44f8-ba48-4e70-b3d3-5f3a41ba121b,moonshotai/Kimi-K2-Instruct-0905,together_ai,train-fasttext,21431,15011,36442,3295.174305,False,0.0,moonshotai/Kimi-K2-Instruct-0905,train-fasttext,3295.174305,False,0.2,False,3295.174305 +c32a6678-a974-4a8c-82c0-8a9a3c702bf2,claude-sonnet-4-20250514,anthropic,extract-elf,8524,3856,12380,629.764203,False,0.0,claude-sonnet-4-20250514,extract-elf,629.764203,False,0.2,False,629.764203 +0a849189-66e1-4a06-b4a5-41812f1dd8db,OpenAI/gpt-oss-20B,together_ai,polyglot-c-py,397,682,1079,26.514535,False,0.0,OpenAI/gpt-oss-20B,polyglot-c-py,26.514535,False,0.0,False,26.514535 +11e3074d-709e-4241-923b-9d55a3e7789a,gemini-2.5-pro,gemini,vulnerable-secret,6657,3085,9742,254.776907,True,1.0,gemini-2.5-pro,vulnerable-secret,254.776907,True,0.8,True,254.776907 +c60cad39-d472-4511-bf76-1191ff3c6d33,gpt-5,openai,chess-best-move,9593,10386,19979,900.114747,False,0.0,gpt-5,chess-best-move,900.114747,False,0.0,False,900.114747 +0f5d7c35-30bd-4b76-8698-e7a9906affe5,zai-org/GLM-4.5-Air-FP8,together_ai,fix-ocaml-gc,41337,37391,78728,3614.86428,False,0.0,zai-org/GLM-4.5-Air-FP8,fix-ocaml-gc,3614.86428,False,0.0,False,3614.86428 
+ba1d22d4-6360-4662-afb7-21f3ebc062d8,gemini-2.5-pro,gemini,model-extraction-relu-logits,2416,2243,4659,537.082613,False,0.0,gemini-2.5-pro,model-extraction-relu-logits,537.082613,False,0.0,False,537.082613 +1906f849-da3a-4728-a22c-4a79ea4c7d0f,openai/gpt-oss-120b,together_ai,merge-diff-arc-agi-task,10563,5701,16264,272.444211,False,0.0,openai/gpt-oss-120b,merge-diff-arc-agi-task,272.444211,False,0.0,False,272.444211 +5fe43ab3-79df-4a1f-bce3-f78b5225b82d,claude-sonnet-4-20250514,anthropic,sqlite-db-truncate,5699,4044,9743,795.044249,False,0.0,claude-sonnet-4-20250514,sqlite-db-truncate,795.044249,False,0.0,False,795.044249 +870b8582-653b-4e67-a8e8-1848ce204ba5,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sanitize-git-repo,6346,1637,7983,127.287694,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sanitize-git-repo,127.287694,False,0.0,False,127.287694 +6cd20851-258a-4dbb-8c63-3fe245907956,zai-org/GLM-4.5-Air-FP8,together_ai,qemu-startup,2990,4652,7642,908.882791,False,0.0,zai-org/GLM-4.5-Air-FP8,qemu-startup,908.882791,False,0.2,False,908.882791 +db727f81-ca38-4bf5-8464-a9f1b7d3f610,gpt-5,openai,train-fasttext,13491,7750,21241,3624.595999,False,0.0,gpt-5,train-fasttext,3624.595999,False,0.0,False,3624.595999 +96448c0f-b062-41b5-9de1-1404ad727b96,gpt-5-mini,openai,financial-document-processor,3923,4040,7963,304.944171,False,0.0,gpt-5-mini,financial-document-processor,304.944171,False,0.0,False,304.944171 +3dab981b-4fff-4807-9f12-01005f0e3517,gpt-5-mini,openai,largest-eigenval,4455,3995,8450,919.798709,False,0.0,gpt-5-mini,largest-eigenval,919.798709,False,0.0,False,919.798709 +41c5dc24-dfae-4084-9527-668b34920f0a,openai/gpt-oss-120b,together_ai,write-compressor,1895,3630,5525,901.886255,False,0.0,openai/gpt-oss-120b,write-compressor,901.886255,False,0.0,False,901.886255 
+688d7dc2-3636-4358-9a68-4241ee609984,claude-opus-4-1-20250805,anthropic,distribution-search,37140,43005,80145,3601.873857,False,0.0,claude-opus-4-1-20250805,distribution-search,3601.873857,False,0.5555555555555556,False,3601.873857 +2763ed6f-98bd-4067-86ed-61529e1be632,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,install-klee-minimal,13421,2562,15983,900.000675,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,install-klee-minimal,900.000675,False,0.0,False,900.000675 +f4e058fb-b6e6-4e75-8350-6c6322d9bc0c,claude-opus-4-1-20250805,anthropic,build-pov-ray,15926,3662,19588,1037.054903,True,1.0,claude-opus-4-1-20250805,build-pov-ray,1037.054903,True,0.75,True,1037.054903 +15f6e573-c7d8-48b9-be03-3c4ad4de283f,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-pmars,14346,3479,17825,929.442623,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-pmars,929.442623,False,0.2,False,929.442623 +702f9780-a0f8-465a-92ee-3bfac2848537,openai/gpt-oss-120b,together_ai,code-from-image,2580,4096,6676,163.994538,False,0.0,openai/gpt-oss-120b,code-from-image,163.994538,False,0.0,False,163.994538 +b3af42e9-65f6-4234-9ff0-2cefa8e50d48,OpenAI/gpt-oss-20B,together_ai,large-scale-text-editing,460,2000,2460,192.586515,False,0.0,OpenAI/gpt-oss-20B,large-scale-text-editing,192.586515,False,0.0,False,192.586515 +99406396-6b9a-474f-92bc-c372074309ba,grok-code-fast-1,xai,build-cython-ext,18348,4421,22769,705.459425,False,0.0,grok-code-fast-1,build-cython-ext,705.459425,False,0.0,False,705.459425 +9237f9fe-3088-417c-869c-844ba45a9a96,deepseek-ai/DeepSeek-V3.1,together_ai,pypi-server,3750,2035,5785,902.408906,True,1.0,deepseek-ai/DeepSeek-V3.1,pypi-server,902.408906,True,0.4,True,902.408906 +d175e902-714d-4be9-b80f-2a8bc23e3787,gemini-2.5-flash,gemini,log-summary-date-ranges,4113,5204,9317,214.425678,False,0.0,gemini-2.5-flash,log-summary-date-ranges,214.425678,False,0.0,False,214.425678 
+f465839f-9d5d-493f-86ab-68a7290a1086,gpt-5,openai,build-cython-ext,11612,8666,20278,900.004222,False,0.0,gpt-5,build-cython-ext,900.004222,False,0.0,False,900.004222 +6af7418d-3806-44ee-908d-4dba724d2eb3,claude-sonnet-4-20250514,anthropic,distribution-search,10333,9673,20006,620.658975,True,1.0,claude-sonnet-4-20250514,distribution-search,620.658975,True,0.6,True,620.658975 +ee6c422e-845d-4fc0-baef-bc302c0d2430,gpt-5-nano,openai,build-cython-ext,21406,7446,28852,904.101111,False,0.0,gpt-5-nano,build-cython-ext,904.101111,False,0.0,False,904.101111 +3c6580cc-8ecb-40ed-b72d-5baca655ad05,deepseek-ai/DeepSeek-V3.1,together_ai,fix-ocaml-gc,47617,24000,71617,3612.920111,False,0.0,deepseek-ai/DeepSeek-V3.1,fix-ocaml-gc,3612.920111,False,0.0,False,3612.920111 +0e35e7b5-4078-4351-aeb8-7b7fa71165a3,gemini-2.5-pro,gemini,run-pdp11-code,8516,4733,13249,1021.943654,False,0.0,gemini-2.5-pro,run-pdp11-code,1021.943654,False,0.0,False,1021.943654 +18a8c0ed-a138-457a-bc5f-e904f3654bc4,openai/gpt-oss-120b,together_ai,distribution-search,1982,2028,4010,102.519354,False,0.0,openai/gpt-oss-120b,distribution-search,102.519354,False,0.0,False,102.519354 +053c9289-db62-4e76-830f-ac9ddcfef8f5,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,feal-differential-cryptanalysis,2348,1228,3576,208.933573,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,feal-differential-cryptanalysis,208.933573,False,0.0,False,208.933573 +45b2f304-ae64-45a4-8558-4e70379cd240,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,run-pdp11-code,5040,4896,9936,1002.416079,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,run-pdp11-code,1002.416079,False,0.0,False,1002.416079 +e0e6f36a-23fc-42b4-9179-df396a846625,moonshotai/Kimi-K2-Instruct-0905,together_ai,video-processing,5210,4524,9734,249.703665,False,0.0,moonshotai/Kimi-K2-Instruct-0905,video-processing,249.703665,False,0.0,False,249.703665 
+ef6d7c00-6f76-4581-912b-022185de56d7,openai/gpt-oss-120b,together_ai,prove-plus-comm,3101,2344,5445,289.439585,True,1.0,openai/gpt-oss-120b,prove-plus-comm,289.439585,True,1.0,True,289.439585 +96138730-f61a-4694-90c5-cff3013f4fa4,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,polyglot-c-py,3409,3196,6605,645.758931,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,polyglot-c-py,645.758931,False,0.0,False,645.758931 +79545fd6-fa00-4dbb-9309-639a5af908da,gemini-2.5-flash,gemini,count-dataset-tokens,7687,2398,10085,369.28612,False,0.0,gemini-2.5-flash,count-dataset-tokens,369.28612,False,0.0,False,369.28612 +2ee959fe-3642-4857-99f6-1c5007862703,zai-org/GLM-4.5-Air-FP8,together_ai,winning-avg-corewars,21249,28100,49349,3606.37442,False,0.0,zai-org/GLM-4.5-Air-FP8,winning-avg-corewars,3606.37442,False,0.0,False,3606.37442 +cc708231-824a-4d53-9b07-ae7b75e66a77,moonshotai/Kimi-K2-Instruct-0905,together_ai,bn-fit-modify,21870,9210,31080,2868.985022,False,0.0,moonshotai/Kimi-K2-Instruct-0905,bn-fit-modify,2868.985022,False,0.0,False,2868.985022 +afc2284e-c651-4b9f-9a9a-11e1a11c4ed2,gpt-5,openai,crack-7z-hash,7880,3266,11146,544.140932,True,1.0,gpt-5,crack-7z-hash,544.140932,True,0.4285714285714285,True,544.140932 +cda59b89-db78-4d9e-b12d-dbff945f4f53,claude-sonnet-4-20250514,anthropic,build-pmars,14974,5872,20846,787.088101,True,1.0,claude-sonnet-4-20250514,build-pmars,787.088101,True,0.6,True,787.088101 +4d9729b9-11c3-47ff-9a6a-cc1b6581cd8a,claude-sonnet-4-20250514,anthropic,form-filling,6463,4597,11060,417.172156,True,1.0,claude-sonnet-4-20250514,form-filling,417.172156,True,1.0,True,417.172156 +e2647158-ab74-4739-9e45-7eac69decfdc,gemini-2.5-flash,gemini,build-pov-ray,6507,9515,16022,1089.011571,False,0.0,gemini-2.5-flash,build-pov-ray,1089.011571,False,0.0,False,1089.011571 
+cf28343f-8e72-46de-a10c-71f2af7e5b44,gemini-2.5-flash,gemini,install-windows-3.11,4767,2722,7489,127.662313,False,0.0,gemini-2.5-flash,install-windows-3.11,127.662313,False,0.0,False,127.662313 +da870387-d393-45d9-a4d9-aae3f8e0b20f,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,path-tracing-reverse,18502,11338,29840,1011.309079,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,path-tracing-reverse,1011.309079,False,0.0,False,1011.309079 +77dbb26b-f9e8-4986-a7c6-b5a082d9434b,gpt-5-nano,openai,nginx-request-logging,10446,7567,18013,949.775719,False,0.0,gpt-5-nano,nginx-request-logging,949.775719,False,0.0,False,949.775719 +800d390a-d43c-4908-8946-44bd5f7d9c7d,gemini-2.5-flash,gemini,financial-document-processor,8139,2557,10696,1217.995469,False,0.0,gemini-2.5-flash,financial-document-processor,1217.995469,False,0.0,False,1217.995469 +fb19a7eb-c94a-4961-9628-b9095bb41d22,gpt-5,openai,make-doom-for-mips,10311,6567,16878,900.011283,False,0.0,gpt-5,make-doom-for-mips,900.011283,False,0.0,False,900.011283 +b34aed8e-0c82-4b4e-a774-efb8bf69a22e,gemini-2.5-flash,gemini,break-filter-js-from-html,1951,1534,3485,127.737458,False,0.0,gemini-2.5-flash,break-filter-js-from-html,127.737458,False,0.0,False,127.737458 +9e9a2d24-9b23-4a95-a8e1-2cb8ef75fbe5,grok-code-fast-1,xai,build-initramfs-qemu,2446,1767,4213,37.845297,False,0.0,grok-code-fast-1,build-initramfs-qemu,37.845297,False,0.0,False,37.845297 +2715c613-1d22-4b6f-8082-af675a5fe2a2,moonshotai/Kimi-K2-Instruct-0905,together_ai,make-doom-for-mips,22219,5864,28083,908.134936,False,0.0,moonshotai/Kimi-K2-Instruct-0905,make-doom-for-mips,908.134936,False,0.0,False,908.134936 +a799dc74-2b21-4dc4-9676-f2ec02d46b72,deepseek-ai/DeepSeek-V3.1,together_ai,mteb-retrieve,2410,1285,3695,195.511405,False,0.0,deepseek-ai/DeepSeek-V3.1,mteb-retrieve,195.511405,False,0.0,False,195.511405 
+22caa237-7018-49d7-99a9-439d403fa56b,openai/gpt-oss-120b,together_ai,build-initramfs-qemu,1361,1264,2625,136.322567,False,0.0,openai/gpt-oss-120b,build-initramfs-qemu,136.322567,False,0.0,False,136.322567 +8db9717c-a718-467c-93bb-521575401644,claude-sonnet-4-20250514,anthropic,mteb-leaderboard,1203,816,2019,58.604664,False,0.0,claude-sonnet-4-20250514,mteb-leaderboard,58.604664,False,0.0,False,58.604664 +b6334679-32dd-436d-b06a-ac0d492406d9,openai/gpt-oss-120b,together_ai,code-from-image,14112,3254,17366,315.091059,False,0.0,openai/gpt-oss-120b,code-from-image,315.091059,False,0.0,False,315.091059 +c3ed7dfe-8950-4c58-a920-18ea42883f59,grok-code-fast-1,xai,tune-mjcf,4092,2629,6721,333.922923,True,1.0,grok-code-fast-1,tune-mjcf,333.922923,True,0.4,True,333.922923 +c47de1c0-bc5a-41b2-8119-96cef019fd54,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,model-extraction-relu-logits,1407,1816,3223,194.910346,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,model-extraction-relu-logits,194.910346,False,0.0,False,194.910346 +15f0d58b-0edb-4c13-bd1a-d9e1b744c036,openai/gpt-oss-120b,together_ai,mteb-leaderboard,1151,904,2055,62.592313,False,0.0,openai/gpt-oss-120b,mteb-leaderboard,62.592313,False,0.0,False,62.592313 +4edc8459-8675-459f-a195-a3a956bbc1c2,claude-opus-4-1-20250805,anthropic,filter-js-from-html,11007,8833,19840,687.531898,False,0.0,claude-opus-4-1-20250805,filter-js-from-html,687.531898,False,0.0,False,687.531898 +08ef2ddf-b5c6-4163-9e27-841c4c06876e,claude-sonnet-4-20250514,anthropic,sparql-university,3847,1086,4933,1013.533783,False,0.0,claude-sonnet-4-20250514,sparql-university,1013.533783,False,0.0,False,1013.533783 +6004a4b8-5eec-43eb-b873-52da8fd9381a,moonshotai/Kimi-K2-Instruct-0905,together_ai,pytorch-model-recovery,20965,15298,36263,900.051785,False,0.0,moonshotai/Kimi-K2-Instruct-0905,pytorch-model-recovery,900.051785,False,0.4,False,900.051785 
+69c75112-05e5-45e8-8986-73703ce702b6,grok-4-0709,xai,merge-diff-arc-agi-task,7145,1998,9143,902.316225,False,0.0,grok-4-0709,merge-diff-arc-agi-task,902.316225,False,0.4,False,902.316225 +76f5c077-dde5-4026-837f-1acfe41f861d,OpenAI/gpt-oss-20B,together_ai,build-cython-ext,7015,20933,27948,900.035396,False,0.0,OpenAI/gpt-oss-20B,build-cython-ext,900.035396,False,0.0,False,900.035396 +395884b6-086c-449b-b11a-154a70c69e32,deepseek-ai/DeepSeek-V3.1,together_ai,configure-git-webserver,5353,1447,6800,335.815698,True,1.0,deepseek-ai/DeepSeek-V3.1,configure-git-webserver,335.815698,True,1.0,True,335.815698 +0220641a-d71e-4f0a-8291-a2593b84812b,claude-opus-4-1-20250805,anthropic,mteb-retrieve,2135,1327,3462,51.32253,False,0.0,claude-opus-4-1-20250805,mteb-retrieve,51.32253,False,0.0,False,51.32253 +365dcd78-ce12-44a0-8d2b-99d43db43394,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,log-summary-date-ranges,10645,5108,15753,393.691667,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,log-summary-date-ranges,393.691667,True,0.8,True,393.691667 +9c19395b-df4b-4347-bf84-cdf2065c6b3e,grok-code-fast-1,xai,crack-7z-hash,9294,4946,14240,907.556997,False,0.0,grok-code-fast-1,crack-7z-hash,907.556997,False,0.6,False,907.556997 +3b29e901-6502-4d4c-b0f1-4233f59c9cba,deepseek-ai/DeepSeek-V3.1,together_ai,write-compressor,10303,9604,19907,598.722451,False,0.0,deepseek-ai/DeepSeek-V3.1,write-compressor,598.722451,False,0.0,False,598.722451 +88b81eb6-e2b1-49e1-8042-7a15cd8b2d09,gemini-2.5-pro,gemini,path-tracing-reverse,18959,16501,35460,1835.024521,False,0.0,gemini-2.5-pro,path-tracing-reverse,1835.024521,False,0.0,False,1835.024521 +985d75a0-5a87-4fa4-a136-910a8413bb30,gpt-5,openai,merge-diff-arc-agi-task,9071,4429,13500,524.795835,True,1.0,gpt-5,merge-diff-arc-agi-task,524.795835,True,1.0,True,524.795835 
+f8dfcd45-b710-4072-b509-82c145e95350,grok-4-0709,xai,reverse-engineering,6779,3654,10433,2616.468792,False,0.0,grok-4-0709,reverse-engineering,2616.468792,False,0.2,False,2616.468792 +d0d3874e-d84c-4023-98a6-442a6a108422,openai/gpt-oss-120b,together_ai,feal-linear-cryptanalysis,9906,8708,18614,522.078941,False,0.0,openai/gpt-oss-120b,feal-linear-cryptanalysis,522.078941,False,0.4,False,522.078941 +170f4cfc-67c0-4bae-b338-b454fa9c9dd0,gpt-5,openai,polyglot-rust-c,2733,2615,5348,921.104387,False,0.0,gpt-5,polyglot-rust-c,921.104387,False,0.0,False,921.104387 +ef7ae628-13fc-4d17-bcf2-69199b854edf,claude-sonnet-4-20250514,anthropic,feal-linear-cryptanalysis,24627,21313,45940,1800.015578,False,0.0,claude-sonnet-4-20250514,feal-linear-cryptanalysis,1800.015578,False,0.0,False,1800.015578 +c9c3597b-0e71-44a6-a06e-f8939153956a,claude-opus-4-1-20250805,anthropic,pytorch-model-recovery,7580,4605,12185,192.191495,True,1.0,claude-opus-4-1-20250805,pytorch-model-recovery,192.191495,True,1.0,True,192.191495 +663f4f86-68cb-44d8-8093-5994321c1fb5,openai/gpt-oss-120b,together_ai,build-pov-ray,9988,3054,13042,1171.269573,False,0.0,openai/gpt-oss-120b,build-pov-ray,1171.269573,False,0.0,False,1171.269573 +fa4d063d-1cbc-44d5-8840-fcf35d6accd9,grok-code-fast-1,xai,sparql-university,4806,1450,6256,142.972353,False,0.0,grok-code-fast-1,sparql-university,142.972353,False,0.2,False,142.972353 +bbe7d28a-4681-4069-a6e6-89afd10b8cdc,gemini-2.5-flash,gemini,vulnerable-secret,7730,30882,38612,907.595431,False,0.0,gemini-2.5-flash,vulnerable-secret,907.595431,False,0.0,False,907.595431 +332fda31-b86e-48ec-9534-4476b6259ac2,claude-opus-4-1-20250805,anthropic,log-summary-date-ranges,7282,1460,8742,82.01714,False,0.0,claude-opus-4-1-20250805,log-summary-date-ranges,82.01714,False,0.8888888888888888,False,82.01714 +0f5b59f4-62d2-4ca9-880d-d689c3ba5736,grok-4-0709,xai,mteb-retrieve,2760,2040,4800,508.654613,False,0.0,grok-4-0709,mteb-retrieve,508.654613,False,0.0,False,508.654613 
+735b85e1-43ce-4cab-bd9a-5be2a1441d5c,claude-opus-4-1-20250805,anthropic,db-wal-recovery,7594,6667,14261,500.045358,False,0.0,claude-opus-4-1-20250805,db-wal-recovery,500.045358,False,0.0,False,500.045358 +2f042871-257d-4970-afd8-a566d86676a0,gemini-2.5-pro,gemini,break-filter-js-from-html,5027,4734,9761,977.348113,True,1.0,gemini-2.5-pro,break-filter-js-from-html,977.348113,True,0.2,True,977.348113 +8ac03aaf-6f58-4c7f-a77e-f77bc85c9faa,zai-org/GLM-4.5-Air-FP8,together_ai,fix-ocaml-gc,40990,25853,66843,2787.353902,False,0.0,zai-org/GLM-4.5-Air-FP8,fix-ocaml-gc,2787.353902,False,0.0,False,2787.353902 +b01af900-ff04-4e4a-b965-3b825a949c84,claude-sonnet-4-20250514,anthropic,fix-ocaml-gc,46819,19723,66542,3611.41212,False,0.0,claude-sonnet-4-20250514,fix-ocaml-gc,3611.41212,False,0.0,False,3611.41212 +41f57a35-8638-4ee8-ba5e-e86de07b3275,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,mteb-retrieve,1504,1375,2879,56.006153,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,mteb-retrieve,56.006153,False,0.0,False,56.006153 +71d1aa7d-b7b6-40ec-bc4d-1bc3524df738,gemini-2.5-flash,gemini,run-pdp11-code,5858,1498,7356,201.115824,False,0.0,gemini-2.5-flash,run-pdp11-code,201.115824,False,0.0,False,201.115824 +241c821d-3cf7-4a42-96cd-b552663cf3a6,gpt-5,openai,sanitize-git-repo,10355,6775,17130,551.618061,False,0.0,gpt-5,sanitize-git-repo,551.618061,False,0.2857142857142857,False,551.618061 +c7ce51aa-46ee-48b7-babb-5fc0562d9331,moonshotai/Kimi-K2-Instruct-0905,together_ai,distribution-search,8580,7995,16575,1127.574018,False,0.0,moonshotai/Kimi-K2-Instruct-0905,distribution-search,1127.574018,False,0.2,False,1127.574018 +13869209-40bb-4e17-9b0a-7b90030c28c9,openai/gpt-oss-120b,together_ai,count-dataset-tokens,1676,1453,3129,243.517091,False,0.0,openai/gpt-oss-120b,count-dataset-tokens,243.517091,False,0.0,False,243.517091 
+8343a0c3-2e37-4db1-8fcf-38e5d8ec53c0,gemini-2.5-pro,gemini,break-filter-js-from-html,1946,1630,3576,346.544619,False,0.0,gemini-2.5-pro,break-filter-js-from-html,346.544619,False,0.2,False,346.544619 +049de1a0-a73b-4a1f-8dd4-fc6e15cd3155,grok-4-0709,xai,pytorch-model-recovery,6540,5220,11760,909.795331,False,0.0,grok-4-0709,pytorch-model-recovery,909.795331,False,0.2,False,909.795331 +e3234ee1-58a6-4294-a6a0-f096ac936ab3,gemini-2.5-pro,gemini,sanitize-git-repo,10454,1694,12148,142.291642,False,0.0,gemini-2.5-pro,sanitize-git-repo,142.291642,False,0.0,False,142.291642 +08fe0f55-973a-4ff6-8852-e2fa4abd7068,claude-opus-4-1-20250805,anthropic,fix-git,3008,1886,4894,82.930545,True,1.0,claude-opus-4-1-20250805,fix-git,82.930545,True,1.0,True,82.930545 +33d4e41d-b94e-4694-b922-4e9ead335775,grok-4-0709,xai,cobol-modernization,4401,2622,7023,914.904313,False,0.0,grok-4-0709,cobol-modernization,914.904313,False,0.2,False,914.904313 +5a1ada2c-70ec-4daf-9f8d-de86b690f113,grok-4-0709,xai,run-pdp11-code,763,250,1013,1007.772376,False,0.0,grok-4-0709,run-pdp11-code,1007.772376,False,0.0,False,1007.772376 +27dd78d5-f4f2-493c-8ee1-f0c75fb92e88,moonshotai/Kimi-K2-Instruct-0905,together_ai,form-filling,7107,5714,12821,327.209381,True,1.0,moonshotai/Kimi-K2-Instruct-0905,form-filling,327.209381,True,0.8,True,327.209381 +ed4880a9-6368-49f7-a946-3844e2cffcb4,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,configure-git-webserver,14444,2905,17349,811.789377,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,configure-git-webserver,811.789377,False,0.6,False,811.789377 +c82a7958-26c2-41fe-9307-8fb583d2ade4,deepseek-ai/DeepSeek-V3.1,together_ai,fix-git,15842,5248,21090,916.094816,True,1.0,deepseek-ai/DeepSeek-V3.1,fix-git,916.094816,True,0.8,True,916.094816 
+8993c076-aa77-4659-80e7-3b742204c767,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,winning-avg-corewars,10423,8434,18857,777.603079,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,winning-avg-corewars,777.603079,False,0.0,False,777.603079 +4a627791-94be-48e9-a2d7-3b34944e2fc6,deepseek-ai/DeepSeek-V3.1,together_ai,distribution-search,21463,16010,37473,1203.850305,False,0.0,deepseek-ai/DeepSeek-V3.1,distribution-search,1203.850305,False,0.0,False,1203.850305 +f87c9eb5-d29a-4370-ab86-5ce30b1686b6,zai-org/GLM-4.5-Air-FP8,together_ai,db-wal-recovery,2219,2929,5148,120.651215,False,0.0,zai-org/GLM-4.5-Air-FP8,db-wal-recovery,120.651215,False,0.0,False,120.651215 +77741cd1-a259-4917-b33c-4dd85aae21cf,gpt-5,openai,build-pov-ray,40008,34830,74838,4502.348002,False,0.0,gpt-5,build-pov-ray,4502.348002,False,0.0,False,4502.348002 +28a9158a-9005-4996-a870-e363a30af346,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,port-compressor,27823,14550,42373,3606.503901,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,port-compressor,3606.503901,False,0.0,False,3606.503901 +49eea92a-499a-403b-a601-f3925dd97902,gemini-2.5-flash,gemini,cobol-modernization,12800,13021,25821,914.479715,False,0.0,gemini-2.5-flash,cobol-modernization,914.479715,False,0.2,False,914.479715 +a0021cd1-27b7-40af-beb5-95c435a72b9d,OpenAI/gpt-oss-20B,together_ai,install-klee-minimal,4089,1480,5569,507.812452,False,0.0,OpenAI/gpt-oss-20B,install-klee-minimal,507.812452,False,0.0,False,507.812452 +9a5af79d-fb5c-4d63-88cb-a176b53e86b8,gpt-5-mini,openai,distribution-search,9629,10817,20446,1309.206797,True,1.0,gpt-5-mini,distribution-search,1309.206797,True,1.0,True,1309.206797 +d867c87b-0ff2-457c-8f8e-abf34cd9e4a7,moonshotai/Kimi-K2-Instruct-0905,together_ai,reverse-engineering,10650,10766,21416,1801.947719,False,0.0,moonshotai/Kimi-K2-Instruct-0905,reverse-engineering,1801.947719,False,0.2,False,1801.947719 
+cb0a7daf-a664-4f7d-868b-8a93287a02fa,gemini-2.5-pro,gemini,make-mips-interpreter,17835,17966,35801,1804.875428,False,0.0,gemini-2.5-pro,make-mips-interpreter,1804.875428,False,0.0,False,1804.875428 +3b796342-349c-4df3-9f6a-945109d63b02,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,winning-avg-corewars,19975,19190,39165,3617.791612,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,winning-avg-corewars,3617.791612,False,0.0,False,3617.791612 +5521ae71-8218-46ff-be18-bf4bf78cf3ae,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,wasm-pipeline,9940,3887,13827,668.711147,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,wasm-pipeline,668.711147,True,0.6,True,668.711147 +5956c3d0-735d-436a-896c-fa99ec7b8f72,gpt-5-mini,openai,reshard-c4-data,1617,2737,4354,486.908328,False,0.0,gpt-5-mini,reshard-c4-data,486.908328,False,0.0,False,486.908328 +7cfa567b-4e73-46e0-b0e2-837968b4c4ac,gpt-5,openai,model-extraction-relu-logits,7110,3900,11010,292.679044,False,0.0,gpt-5,model-extraction-relu-logits,292.679044,False,0.1666666666666666,False,292.679044 +3eaaeeef-de36-4695-960b-3559aa485b32,gpt-5-mini,openai,distribution-search,7571,6049,13620,863.045016,True,1.0,gpt-5-mini,distribution-search,863.045016,True,1.0,True,863.045016 +11f477db-b168-4c19-96ae-5f8efc0f5313,openai/gpt-oss-120b,together_ai,constraints-scheduling,7235,8886,16121,451.557666,True,1.0,openai/gpt-oss-120b,constraints-scheduling,451.557666,True,1.0,True,451.557666 +7c8dc744-ee69-4a0a-bcde-b49bc6706b54,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,fix-ocaml-gc,38271,21696,59967,2571.597242,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,fix-ocaml-gc,2571.597242,False,0.0,False,2571.597242 +064cef09-19de-46a2-bc45-6e9f67524e7f,openai/gpt-oss-120b,together_ai,adaptive-rejection-sampler,5033,2699,7732,217.827978,False,0.0,openai/gpt-oss-120b,adaptive-rejection-sampler,217.827978,False,0.0,False,217.827978 
+448acebb-68b4-4032-b948-f7c071e56d09,gemini-2.5-pro,gemini,count-dataset-tokens,15570,3983,19553,900.227218,False,0.0,gemini-2.5-pro,count-dataset-tokens,900.227218,False,0.0,False,900.227218 +a3063373-c247-457e-a89d-3a401eec3143,gpt-5,openai,install-klee-minimal,7724,3592,11316,900.007161,False,0.0,gpt-5,install-klee-minimal,900.007161,False,0.0,False,900.007161 +1d2345d6-e057-4f24-8e65-8790edce7774,grok-code-fast-1,xai,financial-document-processor,5710,2072,7782,331.041978,False,0.0,grok-code-fast-1,financial-document-processor,331.041978,False,0.0,False,331.041978 +0787e74e-4c3c-43af-8e84-fa92fbbc8d38,gemini-2.5-flash,gemini,sqlite-with-gcov,1489,1150,2639,164.43347,False,0.0,gemini-2.5-flash,sqlite-with-gcov,164.43347,False,0.2,False,164.43347 +cd9cffee-c3dc-43eb-9b49-90bf814d6d4b,deepseek-ai/DeepSeek-V3.1,together_ai,feal-differential-cryptanalysis,2178,1284,3462,121.222539,False,0.0,deepseek-ai/DeepSeek-V3.1,feal-differential-cryptanalysis,121.222539,False,0.0,False,121.222539 +58af9857-e3f3-47f7-b901-253f35c7eed7,gpt-5-mini,openai,qemu-startup,1920,1547,3467,649.734081,True,1.0,gpt-5-mini,qemu-startup,649.734081,True,0.8,True,649.734081 +d469004d-7c96-4869-bdb3-32a99db4bad8,deepseek-ai/DeepSeek-V3.1,together_ai,financial-document-processor,12778,5978,18756,448.614275,False,0.0,deepseek-ai/DeepSeek-V3.1,financial-document-processor,448.614275,False,0.0,False,448.614275 +990c5dd9-1fd5-478d-91c0-0c15e695b74a,gpt-5-nano,openai,cancel-async-tasks,1579,1039,2618,460.080179,False,0.0,gpt-5-nano,cancel-async-tasks,460.080179,False,0.4,False,460.080179 +2a08416e-f896-4c8d-ade4-91265fcb5079,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,vulnerable-secret,3332,3950,7282,286.823811,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,vulnerable-secret,286.823811,False,0.0,False,286.823811 
+6e48cdd4-fb0b-4d1c-a01e-28d6231d3fba,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,train-fasttext,22792,5296,28088,865.611724,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,train-fasttext,865.611724,False,0.0,False,865.611724 +eb19de81-6235-4257-9e0f-26468b1e4d7f,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,write-compressor,1570,1974,3544,59.24247,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,write-compressor,59.24247,False,0.0,False,59.24247 +6c0adec2-25b3-484d-9bb6-ab8486aba1fe,gpt-5-mini,openai,mteb-leaderboard,46336,39151,85487,3600.507909,False,0.0,gpt-5-mini,mteb-leaderboard,3600.507909,False,0.0,False,3600.507909 +89694e03-4fb7-4755-a838-09aa918f8bbe,gpt-5,openai,winning-avg-corewars,32579,34028,66607,3603.644069,False,0.0,gpt-5,winning-avg-corewars,3603.644069,False,0.2857142857142857,False,3603.644069 +3912ab41-b86a-478e-a5af-995eabc2ce0d,gpt-5-mini,openai,regex-log,1704,1353,3057,173.350422,False,0.0,gpt-5-mini,regex-log,173.350422,False,0.8,False,173.350422 +8051cf7f-2de6-4865-9cf9-dc1973d1ee78,grok-4-0709,xai,fix-git,1845,1327,3172,167.355702,True,1.0,grok-4-0709,fix-git,167.355702,True,1.0,True,167.355702 +beb317dd-8cc0-4cd5-8fe2-49dbe4bfcbb8,gemini-2.5-pro,gemini,mteb-leaderboard,31570,20424,51994,2762.811167,False,0.0,gemini-2.5-pro,mteb-leaderboard,2762.811167,False,0.0,False,2762.811167 +c80ab1b4-fece-438c-bb05-c636e0237956,claude-opus-4-1-20250805,anthropic,sanitize-git-repo,12823,3486,16309,903.693157,False,0.0,claude-opus-4-1-20250805,sanitize-git-repo,903.693157,False,0.0,False,903.693157 +c0203012-10f5-4e91-9ad3-268898886a47,gpt-5,openai,code-from-image,21537,21802,43339,1201.63056,False,0.0,gpt-5,code-from-image,1201.63056,False,0.4,False,1201.63056 +802d403e-5284-4a8f-9d89-bbb6008a6805,claude-opus-4-1-20250805,anthropic,extract-elf,6263,2957,9220,128.555051,True,1.0,claude-opus-4-1-20250805,extract-elf,128.555051,True,0.8888888888888888,True,128.555051 
+967d02f3-8d5f-4599-aa55-2aca50b999e0,OpenAI/gpt-oss-20B,together_ai,sqlite-db-truncate,559,829,1388,49.392669,False,0.0,OpenAI/gpt-oss-20B,sqlite-db-truncate,49.392669,False,0.0,False,49.392669 +c5a38b9b-a3d9-49c3-b015-7882f2476bdf,zai-org/GLM-4.5-Air-FP8,together_ai,sanitize-git-repo,13286,3973,17259,549.336437,False,0.0,zai-org/GLM-4.5-Air-FP8,sanitize-git-repo,549.336437,False,0.0,False,549.336437 +7736d7f7-7c2c-4cf3-93ae-69259fcbd531,gemini-2.5-pro,gemini,hf-model-inference,6488,2157,8645,409.329734,False,0.0,gemini-2.5-pro,hf-model-inference,409.329734,False,0.8,False,409.329734 +0f818b21-1780-46f0-a8f4-82fcbacddb4b,grok-4-0709,xai,constraints-scheduling,5912,4163,10075,1101.814021,True,1.0,grok-4-0709,constraints-scheduling,1101.814021,True,0.8,True,1101.814021 +e11f644c-e4e6-41ae-a36f-a95f138e6e40,grok-4-0709,xai,polyglot-c-py,0,0,0,902.57269,False,0.0,grok-4-0709,polyglot-c-py,902.57269,False,0.6,False,902.57269 +c61f5f26-8447-4932-9d30-640e19eaf9a3,moonshotai/Kimi-K2-Instruct-0905,together_ai,vulnerable-secret,1720,2017,3737,910.738663,False,0.0,moonshotai/Kimi-K2-Instruct-0905,vulnerable-secret,910.738663,False,0.2,False,910.738663 +7c99ef96-5e2d-4153-b333-b974b4b93aa4,gemini-2.5-flash,gemini,sqlite-db-truncate,4256,8125,12381,408.856252,False,0.0,gemini-2.5-flash,sqlite-db-truncate,408.856252,False,0.0,False,408.856252 +6085883a-4110-4a6a-ae71-c0ee2b946f65,gpt-5-mini,openai,sparql-university,10105,6338,16443,499.63291,False,0.0,gpt-5-mini,sparql-university,499.63291,False,0.0,False,499.63291 +cbcce4de-0ee3-47a5-a9d8-0bcf92ddb92c,gpt-5,openai,count-dataset-tokens,9388,6449,15837,650.136885,False,0.0,gpt-5,count-dataset-tokens,650.136885,False,0.1666666666666666,False,650.136885 +1321e30a-e0d9-49de-820e-1d7e4daed94a,grok-4-0709,xai,regex-log,1252,842,2094,302.33619,False,0.0,grok-4-0709,regex-log,302.33619,False,0.6,False,302.33619 
+da8185e9-c7cd-4580-87cc-126d4d3ff0ba,deepseek-ai/DeepSeek-V3.1,together_ai,constraints-scheduling,5518,3738,9256,357.755916,True,1.0,deepseek-ai/DeepSeek-V3.1,constraints-scheduling,357.755916,True,0.8,True,357.755916 +f103b773-8968-4255-8010-51bd4d12d885,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,polyglot-rust-c,7348,7249,14597,934.293,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,polyglot-rust-c,934.293,False,0.0,False,934.293 +7fe934b6-ce99-462a-a33e-48d88b051ad4,openai/gpt-oss-120b,together_ai,count-dataset-tokens,6124,3898,10022,428.644218,False,0.0,openai/gpt-oss-120b,count-dataset-tokens,428.644218,False,0.0,False,428.644218 +32847b81-c54f-40ef-aea3-69e7c59819a2,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sqlite-db-truncate,3767,2165,5932,102.045474,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sqlite-db-truncate,102.045474,False,0.0,False,102.045474 +c431d136-1735-4b85-bbd2-beded79c9b39,gpt-5-mini,openai,qemu-startup,4584,4563,9147,812.293778,True,1.0,gpt-5-mini,qemu-startup,812.293778,True,0.8,True,812.293778 +6267cf5f-7f9a-4f2c-b56c-e743cb848131,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,cancel-async-tasks,1297,785,2082,70.058497,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,cancel-async-tasks,70.058497,True,0.8,True,70.058497 +b3750943-d6ab-41d7-a756-aa7997b84b1c,grok-code-fast-1,xai,largest-eigenval,9633,6624,16257,905.303051,False,0.0,grok-code-fast-1,largest-eigenval,905.303051,False,0.0,False,905.303051 +4670eee4-4547-481a-bd56-f3653ad4dcc3,gpt-5-nano,openai,code-from-image,16319,11177,27496,1222.466232,False,0.0,gpt-5-nano,code-from-image,1222.466232,False,0.0,False,1222.466232 +5804a8e2-432a-45e9-8c15-2a038a5549bd,grok-4-0709,xai,polyglot-rust-c,0,0,0,900.109638,False,0.0,grok-4-0709,polyglot-rust-c,900.109638,False,0.0,False,900.109638 
+ff385be5-f800-4056-8b58-f3ea781588b1,gpt-5-nano,openai,build-initramfs-qemu,8089,5534,13623,900.007355,False,0.0,gpt-5-nano,build-initramfs-qemu,900.007355,False,0.0,False,900.007355 +78902d80-ee98-4957-be60-3963d6b9553a,gemini-2.5-pro,gemini,merge-diff-arc-agi-task,8669,3040,11709,870.074649,False,0.0,gemini-2.5-pro,merge-diff-arc-agi-task,870.074649,False,0.6,False,870.074649 +b76be109-c175-4aa4-9fcc-ad35c48685ca,grok-4-0709,xai,pytorch-model-recovery,5969,4397,10366,900.0293,False,0.0,grok-4-0709,pytorch-model-recovery,900.0293,False,0.2,False,900.0293 +0140c865-fe86-4646-a5dd-27a9ff1abfca,gemini-2.5-pro,gemini,build-pov-ray,16160,3114,19274,571.150078,True,1.0,gemini-2.5-pro,build-pov-ray,571.150078,True,1.0,True,571.150078 +d03e12ad-c390-48a4-a362-91ee2387ff17,moonshotai/Kimi-K2-Instruct-0905,together_ai,adaptive-rejection-sampler,15112,9802,24914,903.530692,False,0.0,moonshotai/Kimi-K2-Instruct-0905,adaptive-rejection-sampler,903.530692,False,0.0,False,903.530692 +e9b5848b-52fc-4b61-8203-242f2fde4b19,claude-opus-4-1-20250805,anthropic,port-compressor,59589,43135,102724,3613.633762,False,0.0,claude-opus-4-1-20250805,port-compressor,3613.633762,False,0.0,False,3613.633762 +0008e336-0b20-40c1-a7b7-171a24dedb1e,claude-opus-4-1-20250805,anthropic,break-filter-js-from-html,26423,24301,50724,1200.000446,False,0.0,claude-opus-4-1-20250805,break-filter-js-from-html,1200.000446,False,0.2222222222222222,False,1200.000446 +e972881c-6cea-4ec9-b84d-837fc49c8a5a,gpt-5-nano,openai,path-tracing-reverse,2209,1332,3541,136.947874,False,0.0,gpt-5-nano,path-tracing-reverse,136.947874,False,0.0,False,136.947874 +9bbd4c87-46d0-4cbe-bdfc-e74e312bc832,gpt-5-nano,openai,form-filling,11376,9125,20501,256.983497,True,1.0,gpt-5-nano,form-filling,256.983497,True,0.6,True,256.983497 
+f024c09f-67a1-4fdc-9db6-8853dacca02e,moonshotai/Kimi-K2-Instruct-0905,together_ai,count-dataset-tokens,11247,4946,16193,564.917355,False,0.0,moonshotai/Kimi-K2-Instruct-0905,count-dataset-tokens,564.917355,False,0.2,False,564.917355 +97ecf028-b6af-45fe-b1c6-3779feb26b1a,claude-opus-4-1-20250805,anthropic,make-doom-for-mips,18469,6510,24979,901.917677,False,0.0,claude-opus-4-1-20250805,make-doom-for-mips,901.917677,False,0.0,False,901.917677 +be166240-44c0-47a6-9802-2086de981cc8,gemini-2.5-pro,gemini,constraints-scheduling,5837,3900,9737,497.636497,True,1.0,gemini-2.5-pro,constraints-scheduling,497.636497,True,1.0,True,497.636497 +7467a2c2-8077-430d-a09e-21efbd2ae18c,gpt-5-nano,openai,winning-avg-corewars,45503,41283,86786,3629.853352,False,0.0,gpt-5-nano,winning-avg-corewars,3629.853352,False,0.0,False,3629.853352 +cd0ffe4c-b7b6-4827-a327-2d34d1b0b6ad,claude-opus-4-1-20250805,anthropic,pypi-server,4958,2815,7773,111.040107,True,1.0,claude-opus-4-1-20250805,pypi-server,111.040107,True,1.0,True,111.040107 +d4b87041-cda1-4319-8c0c-2e2d61f42e52,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,qemu-alpine-ssh,4089,4382,8471,950.905527,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,qemu-alpine-ssh,950.905527,True,0.2,True,950.905527 +014bc748-6694-44a2-a6dc-ee732ffbb905,grok-code-fast-1,xai,cobol-modernization,5590,2492,8082,153.668445,False,0.0,grok-code-fast-1,cobol-modernization,153.668445,False,0.6,False,153.668445 +d6d3c95f-e1b7-4755-9b50-928646599244,claude-sonnet-4-20250514,anthropic,code-from-image,8626,10186,18812,595.062854,False,0.0,claude-sonnet-4-20250514,code-from-image,595.062854,False,0.2,False,595.062854 +aca9a3cf-9a3f-4780-88e8-ed725137a1ec,moonshotai/Kimi-K2-Instruct-0905,together_ai,pytorch-model-recovery,6923,5076,11999,750.217438,True,1.0,moonshotai/Kimi-K2-Instruct-0905,pytorch-model-recovery,750.217438,True,0.4,True,750.217438 
+651d6c3f-f87b-44c7-9bfd-e13ff2cace3f,moonshotai/Kimi-K2-Instruct-0905,together_ai,gpt2-codegolf,14338,11484,25822,905.922495,False,0.0,moonshotai/Kimi-K2-Instruct-0905,gpt2-codegolf,905.922495,False,0.0,False,905.922495 +c7b8b4c0-89e6-4fc2-a813-a15b8d72869d,zai-org/GLM-4.5-Air-FP8,together_ai,form-filling,11017,10228,21245,224.783559,True,1.0,zai-org/GLM-4.5-Air-FP8,form-filling,224.783559,True,0.8,True,224.783559 +51b5bd62-b69d-466b-af88-516dc805c0e0,gpt-5,openai,schemelike-metacircular-eval,9585,30275,39860,2401.158472,False,0.0,gpt-5,schemelike-metacircular-eval,2401.158472,False,0.0,False,2401.158472 +bf255481-ad29-4dd8-8c91-b83637ecd598,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sqlite-db-truncate,7364,6034,13398,909.242928,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sqlite-db-truncate,909.242928,False,0.0,False,909.242928 +16c938ab-cddf-4574-a03e-22dfa1e6f20a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,circuit-fibsqrt,3825,3438,7263,292.816599,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,circuit-fibsqrt,292.816599,False,0.0,False,292.816599 +669853d5-65f0-4664-b562-f36c14dbc973,claude-opus-4-1-20250805,anthropic,install-klee-minimal,8667,1643,10310,900.190278,False,0.0,claude-opus-4-1-20250805,install-klee-minimal,900.190278,False,0.0,False,900.190278 +1656a26b-f7fd-409f-8fd2-3ed781dcde33,claude-opus-4-1-20250805,anthropic,train-fasttext,31716,13315,45031,3622.815267,False,0.0,claude-opus-4-1-20250805,train-fasttext,3622.815267,False,0.2857142857142857,False,3622.815267 +df7d3bd4-68d9-41ad-9134-6f7bee6839b6,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,git-leak-recovery,2718,1981,4699,153.461073,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,git-leak-recovery,153.461073,True,1.0,True,153.461073 +a43c3cf3-e59e-47d7-96e8-63d7f7571cee,gemini-2.5-pro,gemini,mteb-retrieve,1998,973,2971,235.588292,False,0.0,gemini-2.5-pro,mteb-retrieve,235.588292,False,0.0,False,235.588292 
+ddc92b38-9466-41a5-99ec-e31a709ba96e,gpt-5,openai,sqlite-with-gcov,5598,1463,7061,436.212848,False,0.0,gpt-5,sqlite-with-gcov,436.212848,False,0.3333333333333333,False,436.212848 +066fbfe6-f59c-4fc4-8e3f-41da24ca2026,grok-code-fast-1,xai,make-doom-for-mips,14766,3102,17868,578.118148,False,0.0,grok-code-fast-1,make-doom-for-mips,578.118148,False,0.0,False,578.118148 +6ef22d23-a879-40d3-8a98-ed05816976ae,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,pypi-server,9103,4533,13636,713.294589,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,pypi-server,713.294589,False,0.0,False,713.294589 +34477d7e-073b-4318-be0e-a3bd68463ff8,gpt-5-nano,openai,pypi-server,5363,2505,7868,689.40874,False,0.0,gpt-5-nano,pypi-server,689.40874,False,0.8,False,689.40874 +f94a492f-d93f-46e1-a3cf-24d0237f98b0,grok-code-fast-1,xai,feal-differential-cryptanalysis,2190,1155,3345,149.303963,False,0.0,grok-code-fast-1,feal-differential-cryptanalysis,149.303963,False,0.0,False,149.303963 +0265fe6c-a1dc-4955-8713-c6a8b726103e,grok-4-0709,xai,path-tracing-reverse,2769,4005,6774,1856.440668,False,0.0,grok-4-0709,path-tracing-reverse,1856.440668,False,0.0,False,1856.440668 +2e1384ad-3a24-44aa-8735-33204c510876,openai/gpt-oss-120b,together_ai,path-tracing,8570,3511,12081,205.974847,False,0.0,openai/gpt-oss-120b,path-tracing,205.974847,False,0.0,False,205.974847 +548fad12-326a-47c7-ac45-7f15c1f847a4,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,chess-best-move,2847,1697,4544,348.819779,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,chess-best-move,348.819779,False,0.0,False,348.819779 +e6dab586-0ee2-4913-96ca-b84e461dd698,claude-opus-4-1-20250805,anthropic,build-pov-ray,45603,17071,62674,2203.271707,False,0.0,claude-opus-4-1-20250805,build-pov-ray,2203.271707,False,0.75,False,2203.271707 
+5c64a0ce-0d37-43dd-b734-44f1e0bbd3f2,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,winning-avg-corewars,13457,9402,22859,1018.186355,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,winning-avg-corewars,1018.186355,False,0.0,False,1018.186355 +f81f030a-7184-492c-aab0-5745976961b6,claude-opus-4-1-20250805,anthropic,build-pmars,836,236,1072,1774.903555,False,0.0,claude-opus-4-1-20250805,build-pmars,1774.903555,False,0.5,False,1774.903555 +f7b1dcee-8e5c-48e5-966a-3f61c7bd2d35,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sqlite-with-gcov,3374,1145,4519,145.642585,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sqlite-with-gcov,145.642585,False,0.4,False,145.642585 +92ad4c47-85fb-4799-9501-d9a758ee09d9,gemini-2.5-pro,gemini,pytorch-model-recovery,14185,5485,19670,447.808289,True,1.0,gemini-2.5-pro,pytorch-model-recovery,447.808289,True,1.0,True,447.808289 +d0cc5d13-8e80-4833-a3ee-3dbad4f2b037,grok-4-0709,xai,circuit-fibsqrt,1412,707,2119,3604.803117,False,0.0,grok-4-0709,circuit-fibsqrt,3604.803117,False,0.0,False,3604.803117 +cd492866-5608-40c9-86d0-0cb7fa6682df,gemini-2.5-flash,gemini,hf-model-inference,2938,1421,4359,80.987162,False,0.0,gemini-2.5-flash,hf-model-inference,80.987162,False,0.6,False,80.987162 +2a545337-3758-4fba-9002-a02d342df170,gemini-2.5-flash,gemini,cancel-async-tasks,1947,821,2768,86.1771,False,0.0,gemini-2.5-flash,cancel-async-tasks,86.1771,False,0.2,False,86.1771 +b0174e4f-1dbc-4e8d-92a7-1ea442ffc51e,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,password-recovery,3698,2230,5928,1551.820187,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,password-recovery,1551.820187,False,0.2,False,1551.820187 +e027b7b1-63bc-40f8-bf55-51fafff0b103,claude-opus-4-1-20250805,anthropic,chess-best-move,9490,6336,15826,216.625252,False,0.0,claude-opus-4-1-20250805,chess-best-move,216.625252,False,0.0,False,216.625252 
+5c1ae364-88fd-45f3-8965-aed30240426c,gpt-5-mini,openai,pypi-server,2892,1409,4301,122.950557,True,1.0,gpt-5-mini,pypi-server,122.950557,True,0.8,True,122.950557 +346b266b-605c-4111-9355-09cb07bcb186,grok-code-fast-1,xai,qemu-alpine-ssh,1183,961,2144,169.544178,False,0.0,grok-code-fast-1,qemu-alpine-ssh,169.544178,False,0.0,False,169.544178 +451ba60c-f495-47a5-8934-d6d19e399f0f,claude-opus-4-1-20250805,anthropic,reverse-engineering,11466,9091,20557,1801.516985,False,0.0,claude-opus-4-1-20250805,reverse-engineering,1801.516985,False,0.0,False,1801.516985 +710d6e3d-908f-4740-b092-fab2159d60fc,gemini-2.5-pro,gemini,vulnerable-secret,6393,1986,8379,840.93766,True,1.0,gemini-2.5-pro,vulnerable-secret,840.93766,True,0.8,True,840.93766 +c8e6a74b-a916-4ac5-94e3-15bbe499d3c3,OpenAI/gpt-oss-20B,together_ai,fix-git,8977,11989,20966,911.780632,False,0.0,OpenAI/gpt-oss-20B,fix-git,911.780632,False,0.2,False,911.780632 +ef387938-4766-4702-ba44-0f1eed497cb2,claude-sonnet-4-20250514,anthropic,break-filter-js-from-html,6326,6476,12802,1201.584268,False,0.0,claude-sonnet-4-20250514,break-filter-js-from-html,1201.584268,False,0.0,False,1201.584268 +5790beb7-d658-460b-9988-92d5ad239da9,moonshotai/Kimi-K2-Instruct-0905,together_ai,db-wal-recovery,8577,4956,13533,957.637056,False,0.0,moonshotai/Kimi-K2-Instruct-0905,db-wal-recovery,957.637056,False,0.0,False,957.637056 +e3ade6ea-eb25-46fe-b73e-f23c923b94fc,moonshotai/Kimi-K2-Instruct-0905,together_ai,feal-differential-cryptanalysis,20869,23844,44713,1299.273454,False,0.0,moonshotai/Kimi-K2-Instruct-0905,feal-differential-cryptanalysis,1299.273454,False,0.0,False,1299.273454 +645746e6-645e-4c35-9afc-87f4d2a6422e,deepseek-ai/DeepSeek-V3.1,together_ai,dna-insert,10543,6086,16629,180.13392,False,0.0,deepseek-ai/DeepSeek-V3.1,dna-insert,180.13392,False,0.0,False,180.13392 
+0c90ba40-dfcb-49c4-8df6-644da427922f,gpt-5,openai,financial-document-processor,10848,8701,19549,527.003723,False,0.0,gpt-5,financial-document-processor,527.003723,False,0.0,False,527.003723 +682a1d0f-6c73-418b-9ccb-91c68c9c52ee,gpt-5-nano,openai,extract-elf,15750,3171,18921,272.078997,False,0.0,gpt-5-nano,extract-elf,272.078997,False,0.2,False,272.078997 +2480e1e3-7d49-4248-bd01-2e4c90947e6b,grok-code-fast-1,xai,merge-diff-arc-agi-task,8013,2589,10602,801.21029,True,1.0,grok-code-fast-1,merge-diff-arc-agi-task,801.21029,True,0.8,True,801.21029 +faf4e312-450e-4fb2-bb93-b971ae700a88,grok-4-0709,xai,chess-best-move,8891,1230,10121,900.266951,False,0.0,grok-4-0709,chess-best-move,900.266951,False,0.0,False,900.266951 +634f39b8-512a-4f46-8b0d-dbbed57ffd01,gemini-2.5-pro,gemini,make-mips-interpreter,30193,39760,69953,1802.37413,False,0.0,gemini-2.5-pro,make-mips-interpreter,1802.37413,False,0.0,False,1802.37413 +d4b97c07-8f82-40c3-83fb-b6ec8b5665d5,grok-code-fast-1,xai,configure-git-webserver,5042,1170,6212,155.284657,False,0.0,grok-code-fast-1,configure-git-webserver,155.284657,False,0.0,False,155.284657 +01b5556e-d6be-49cd-85bf-30724e006683,gpt-5,openai,tune-mjcf,8801,5341,14142,903.789968,False,0.0,gpt-5,tune-mjcf,903.789968,False,0.0,False,903.789968 +5c3560d2-ca9d-453a-9a17-aa4b022d72b1,claude-opus-4-1-20250805,anthropic,financial-document-processor,11483,5850,17333,433.509708,False,0.0,claude-opus-4-1-20250805,financial-document-processor,433.509708,False,0.0,False,433.509708 +85eed476-988c-4c70-a41c-be830e1dcdc3,openai/gpt-oss-120b,together_ai,break-filter-js-from-html,5757,7814,13571,1254.780368,False,0.0,openai/gpt-oss-120b,break-filter-js-from-html,1254.780368,False,0.0,False,1254.780368 +f58f6292-ae5e-4699-abb2-4a9a20f8da86,moonshotai/Kimi-K2-Instruct-0905,together_ai,configure-git-webserver,7277,3198,10475,369.364724,True,1.0,moonshotai/Kimi-K2-Instruct-0905,configure-git-webserver,369.364724,True,0.6,True,369.364724 
+2645a1f5-2ae3-4937-a1eb-f51f8e44f383,grok-4-0709,xai,gpt2-codegolf,1051,543,1594,165.626822,False,0.0,grok-4-0709,gpt2-codegolf,165.626822,False,0.0,False,165.626822 +7ee4a787-9089-44a9-a2b5-36d1ef3de55b,gpt-5-nano,openai,dna-insert,962,2150,3112,360.376733,False,0.0,gpt-5-nano,dna-insert,360.376733,False,0.0,False,360.376733 +f6a4a0f7-99ac-4714-ba7a-d2a2c2b303d5,OpenAI/gpt-oss-20B,together_ai,make-mips-interpreter,1398,2100,3498,398.553723,False,0.0,OpenAI/gpt-oss-20B,make-mips-interpreter,398.553723,False,0.0,False,398.553723 +8c0ff9ee-3307-415d-ae8a-bfc0e59ec372,gemini-2.5-pro,gemini,git-leak-recovery,2212,1356,3568,247.138438,True,1.0,gemini-2.5-pro,git-leak-recovery,247.138438,True,1.0,True,247.138438 +b15f9917-b080-4007-85c0-461f6a5172c8,deepseek-ai/DeepSeek-V3.1,together_ai,mteb-retrieve,2280,1258,3538,125.278376,False,0.0,deepseek-ai/DeepSeek-V3.1,mteb-retrieve,125.278376,False,0.0,False,125.278376 +609bf8bc-f2f9-41d8-8618-40232ace33a2,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,bn-fit-modify,27949,4873,32822,1356.639144,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,bn-fit-modify,1356.639144,False,0.0,False,1356.639144 +b3806b10-c331-4cfc-b6af-c6deda827499,grok-4-0709,xai,path-tracing,3718,3624,7342,1800.046095,False,0.0,grok-4-0709,path-tracing,1800.046095,False,0.0,False,1800.046095 +c26f7a7b-2f4b-4ff1-8232-7e44d8fb28bb,gpt-5,openai,train-fasttext,13162,7879,21041,3648.158015,False,0.0,gpt-5,train-fasttext,3648.158015,False,0.0,False,3648.158015 +6ffea995-64ee-40bf-acfe-eef9119779a7,grok-code-fast-1,xai,pypi-server,3874,1626,5500,164.824983,True,1.0,grok-code-fast-1,pypi-server,164.824983,True,0.8,True,164.824983 +7efcbc2e-b819-4733-8889-559bd94012cb,gemini-2.5-flash,gemini,adaptive-rejection-sampler,10695,35736,46431,907.473425,False,0.0,gemini-2.5-flash,adaptive-rejection-sampler,907.473425,False,0.0,False,907.473425 
+bd34762d-78dd-4358-a303-dfa71baa2f75,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,merge-diff-arc-agi-task,9872,3918,13790,277.19801,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,merge-diff-arc-agi-task,277.19801,True,0.4,True,277.19801 +1eedae27-bd40-4e49-a7ea-7e53f3ea2559,grok-code-fast-1,xai,log-summary-date-ranges,7271,3807,11078,135.948771,False,0.0,grok-code-fast-1,log-summary-date-ranges,135.948771,False,0.0,False,135.948771 +c7b00e2a-235a-4a13-8741-815937b1d10d,claude-opus-4-1-20250805,anthropic,fix-ocaml-gc,30244,13473,43717,1770.354747,True,1.0,claude-opus-4-1-20250805,fix-ocaml-gc,1770.354747,True,0.5,True,1770.354747 +d46da707-f363-421d-a013-9f55fa03bc25,grok-4-0709,xai,train-fasttext,28435,8862,37297,3601.974087,False,0.0,grok-4-0709,train-fasttext,3601.974087,False,0.2,False,3601.974087 +82ec03ad-af46-41e1-8425-3cb4a0fb497a,moonshotai/Kimi-K2-Instruct-0905,together_ai,constraints-scheduling,6009,3985,9994,360.88604,False,0.0,moonshotai/Kimi-K2-Instruct-0905,constraints-scheduling,360.88604,False,0.6,False,360.88604 +6eefad9f-1b07-4d90-8b80-8a53d6f083e3,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,install-klee-minimal,10815,3093,13908,1730.283575,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,install-klee-minimal,1730.283575,False,0.0,False,1730.283575 +f913c078-a29f-4c0a-a0b5-0592cd51c8dd,gpt-5,openai,feal-linear-cryptanalysis,7275,2906,10181,656.289345,True,1.0,gpt-5,feal-linear-cryptanalysis,656.289345,True,1.0,True,656.289345 +8309d400-74b4-4c07-9df7-7c5d749202ea,gpt-5-mini,openai,install-klee-minimal,6564,3524,10088,900.035298,False,0.0,gpt-5-mini,install-klee-minimal,900.035298,False,0.0,False,900.035298 +2833003f-73f5-44b2-a86b-60481d610544,OpenAI/gpt-oss-20B,together_ai,qemu-startup,1101,592,1693,39.335629,False,0.0,OpenAI/gpt-oss-20B,qemu-startup,39.335629,False,0.0,False,39.335629 
+78302e81-3543-4e55-a824-613628e153b7,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,cobol-modernization,5641,8139,13780,900.001416,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,cobol-modernization,900.001416,False,0.0,False,900.001416 +b58843e7-272e-4ef2-938b-f02092be20dd,grok-4-0709,xai,cobol-modernization,3793,2679,6472,900.037524,False,0.0,grok-4-0709,cobol-modernization,900.037524,False,0.2,False,900.037524 +308438a9-434b-4e9c-9e07-291bfcdbb6a8,openai/gpt-oss-120b,together_ai,fix-ocaml-gc,15950,7426,23376,3622.551929,False,0.0,openai/gpt-oss-120b,fix-ocaml-gc,3622.551929,False,0.0,False,3622.551929 +26ad594b-f57e-4149-8603-5f0f30164e7d,deepseek-ai/DeepSeek-V3.1,together_ai,feal-differential-cryptanalysis,19945,21011,40956,1332.276715,False,0.0,deepseek-ai/DeepSeek-V3.1,feal-differential-cryptanalysis,1332.276715,False,0.0,False,1332.276715 +51c3aa97-9c56-4bef-8fe4-1fa6065b2e7b,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,port-compressor,84335,65367,149702,3600.001236,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,port-compressor,3600.001236,False,0.0,False,3600.001236 +849a7209-4d31-44c5-92e2-e580ba21d6c5,deepseek-ai/DeepSeek-V3.1,together_ai,crack-7z-hash,9337,4199,13536,683.427737,True,1.0,deepseek-ai/DeepSeek-V3.1,crack-7z-hash,683.427737,True,0.8,True,683.427737 +b4dcd200-3749-427a-aa0a-e020839f3326,grok-4-0709,xai,db-wal-recovery,2532,3214,5746,463.301235,True,1.0,grok-4-0709,db-wal-recovery,463.301235,True,0.2,True,463.301235 +d7a5d5ca-e2bb-4d0b-9cd1-0e8fb4b699f0,gpt-5,openai,run-pdp11-code,12218,10526,22744,914.572972,False,0.0,gpt-5,run-pdp11-code,914.572972,False,0.0,False,914.572972 +4b55825a-b820-4484-99fb-4cf6faa06238,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,distribution-search,3616,2368,5984,243.073717,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,distribution-search,243.073717,False,0.0,False,243.073717 
+3daab2bb-9f6c-4a3f-aae5-96054b8a365c,gpt-5-mini,openai,largest-eigenval,12319,12812,25131,950.066419,False,0.0,gpt-5-mini,largest-eigenval,950.066419,False,0.0,False,950.066419 +8ca72de2-e04c-4965-9955-fb7e9255a194,gpt-5-nano,openai,mteb-retrieve,32349,23646,55995,1875.76028,False,0.0,gpt-5-nano,mteb-retrieve,1875.76028,False,0.0,False,1875.76028 +b63b9979-6887-48d0-89a0-04aad774acb9,gemini-2.5-flash,gemini,schemelike-metacircular-eval,36666,83150,119816,2411.472757,False,0.0,gemini-2.5-flash,schemelike-metacircular-eval,2411.472757,False,0.2,False,2411.472757 +364b4a60-23d4-4181-a183-b09e3bf200be,claude-opus-4-1-20250805,anthropic,password-recovery,5852,4637,10489,260.188883,True,1.0,claude-opus-4-1-20250805,password-recovery,260.188883,True,0.5555555555555556,True,260.188883 +f0f64979-e489-49dc-85a1-fe1cbc592a79,zai-org/GLM-4.5-Air-FP8,together_ai,feal-linear-cryptanalysis,21578,19106,40684,1806.338421,False,0.0,zai-org/GLM-4.5-Air-FP8,feal-linear-cryptanalysis,1806.338421,False,0.0,False,1806.338421 +9f47b0e3-05bb-4703-a172-76b774201914,deepseek-ai/DeepSeek-V3.1,together_ai,path-tracing,15627,12358,27985,622.446642,False,0.0,deepseek-ai/DeepSeek-V3.1,path-tracing,622.446642,False,0.0,False,622.446642 +5d04e8a7-b826-4e79-840a-af4302fc43e2,gemini-2.5-pro,gemini,path-tracing-reverse,12504,12997,25501,1804.042435,False,0.0,gemini-2.5-pro,path-tracing-reverse,1804.042435,False,0.0,False,1804.042435 +9d8844cf-a603-4d51-a136-a18e75d3c67b,gemini-2.5-flash,gemini,pytorch-model-recovery,4061,10613,14674,900.007547,False,0.0,gemini-2.5-flash,pytorch-model-recovery,900.007547,False,0.2,False,900.007547 +23f3c0c3-60ed-4ee6-b36e-d77d0c250506,openai/gpt-oss-120b,together_ai,gpt2-codegolf,3161,7953,11114,901.131075,False,0.0,openai/gpt-oss-120b,gpt2-codegolf,901.131075,False,0.0,False,901.131075 
+c77b43a3-de6f-41f8-8500-a23196b70b3e,claude-opus-4-1-20250805,anthropic,log-summary-date-ranges,7628,1858,9486,171.94883,True,1.0,claude-opus-4-1-20250805,log-summary-date-ranges,171.94883,True,0.8888888888888888,True,171.94883 +11a0bd98-5cd2-4fa9-8e23-b581bd0f71bd,OpenAI/gpt-oss-20B,together_ai,wasm-pipeline,3242,7431,10673,901.233305,False,0.0,OpenAI/gpt-oss-20B,wasm-pipeline,901.233305,False,0.0,False,901.233305 +d274f36f-cbc1-4837-b9da-0e41efd61101,claude-sonnet-4-20250514,anthropic,fix-git,3760,2047,5807,103.529054,True,1.0,claude-sonnet-4-20250514,fix-git,103.529054,True,1.0,True,103.529054 +e859f139-86f3-46f2-bfee-c76d9a4af199,moonshotai/Kimi-K2-Instruct-0905,together_ai,vulnerable-secret,13789,10085,23874,904.522982,False,0.0,moonshotai/Kimi-K2-Instruct-0905,vulnerable-secret,904.522982,False,0.2,False,904.522982 +c904789f-a043-4520-8b36-86174e51a350,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,cancel-async-tasks,1425,1012,2437,101.834606,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,cancel-async-tasks,101.834606,True,0.8,True,101.834606 +6b95e0dd-69f3-47b9-90e0-fcac5abaa2c9,zai-org/GLM-4.5-Air-FP8,together_ai,qemu-alpine-ssh,3707,6332,10039,900.017509,False,0.0,zai-org/GLM-4.5-Air-FP8,qemu-alpine-ssh,900.017509,False,0.0,False,900.017509 +09331612-af95-462e-9ac8-84f8401c065b,gpt-5,openai,install-windows-3.11,4757,1916,6673,290.538304,False,0.0,gpt-5,install-windows-3.11,290.538304,False,0.0,False,290.538304 +208e5257-6ee2-4a92-8f8e-f68712fe9794,gemini-2.5-pro,gemini,schemelike-metacircular-eval,21146,23638,44784,1456.767477,False,0.0,gemini-2.5-pro,schemelike-metacircular-eval,1456.767477,False,0.0,False,1456.767477 +bee85626-fc72-4c57-9109-f3019ca3e8b0,openai/gpt-oss-120b,together_ai,nginx-request-logging,3842,1100,4942,91.825849,True,1.0,openai/gpt-oss-120b,nginx-request-logging,91.825849,True,0.4,True,91.825849 
+7651f3ee-ab0d-433f-8810-8305f3535ac8,gpt-5,openai,openssl-selfsigned-cert,2203,1566,3769,111.747008,True,1.0,gpt-5,openssl-selfsigned-cert,111.747008,True,1.0,True,111.747008 +bd86c98c-2dc2-4204-ab57-36ea899eb2e2,gemini-2.5-pro,gemini,gpt2-codegolf,7599,10550,18149,578.831026,False,0.0,gemini-2.5-pro,gpt2-codegolf,578.831026,False,0.0,False,578.831026 +4d28bf30-11b5-4523-8dc5-b37242f17efb,gpt-5-nano,openai,schemelike-metacircular-eval,21285,35677,56962,2411.539425,False,0.0,gpt-5-nano,schemelike-metacircular-eval,2411.539425,False,0.2,False,2411.539425 +3dd1acc3-56b0-42c5-902a-0c0d3a7955f5,zai-org/GLM-4.5-Air-FP8,together_ai,financial-document-processor,4315,3284,7599,120.205635,False,0.0,zai-org/GLM-4.5-Air-FP8,financial-document-processor,120.205635,False,0.0,False,120.205635 +a6e6f102-fd32-4f81-b389-2786ed6a5c07,gemini-2.5-pro,gemini,crack-7z-hash,9262,2988,12250,432.637942,True,1.0,gemini-2.5-pro,crack-7z-hash,432.637942,True,0.8,True,432.637942 +5d46de94-8c27-43d6-933f-6d8adb739eef,moonshotai/Kimi-K2-Instruct-0905,together_ai,mteb-retrieve,3934,3327,7261,436.124129,False,0.0,moonshotai/Kimi-K2-Instruct-0905,mteb-retrieve,436.124129,False,0.0,False,436.124129 +c8b937df-3356-45ee-8b8a-53b464d80dd6,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,hf-model-inference,8466,4115,12581,573.637162,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,hf-model-inference,573.637162,False,0.0,False,573.637162 +86c503f7-e52c-4968-9a1e-522a65e56d3a,gemini-2.5-flash,gemini,db-wal-recovery,2472,5407,7879,904.015827,False,0.0,gemini-2.5-flash,db-wal-recovery,904.015827,False,0.0,False,904.015827 +a5b84316-9b3f-49b5-9cd6-34cef6e02703,OpenAI/gpt-oss-20B,together_ai,openssl-selfsigned-cert,724,770,1494,43.791773,False,0.0,OpenAI/gpt-oss-20B,openssl-selfsigned-cert,43.791773,False,0.2,False,43.791773 +2ebf77d2-5ed9-47fe-b2f7-11ce9c4ffbc2,gpt-5-nano,openai,wasm-pipeline,14160,9558,23718,938.986527,False,0.0,gpt-5-nano,wasm-pipeline,938.986527,False,0.0,False,938.986527 
+16cc88fa-70e7-4db8-9c81-2ed8f543f4d1,claude-opus-4-1-20250805,anthropic,feal-linear-cryptanalysis,13838,10893,24731,1800.000444,False,0.0,claude-opus-4-1-20250805,feal-linear-cryptanalysis,1800.000444,False,0.0,False,1800.000444 +74a87cbc-94ad-4fa5-b828-3b7a5b755a5e,zai-org/GLM-4.5-Air-FP8,together_ai,financial-document-processor,17418,9373,26791,1200.000845,False,0.0,zai-org/GLM-4.5-Air-FP8,financial-document-processor,1200.000845,False,0.0,False,1200.000845 +e4b67a7c-7e5c-4904-8cbc-42b2922466da,gpt-5-nano,openai,circuit-fibsqrt,29614,28948,58562,3602.854599,False,0.0,gpt-5-nano,circuit-fibsqrt,3602.854599,False,0.0,False,3602.854599 +c415280f-a7d7-42f9-b619-96e962697aef,deepseek-ai/DeepSeek-V3.1,together_ai,db-wal-recovery,10079,8541,18620,904.307912,False,0.0,deepseek-ai/DeepSeek-V3.1,db-wal-recovery,904.307912,False,0.0,False,904.307912 +59c2a27d-ff13-426b-b7bd-659205ca9654,gemini-2.5-pro,gemini,configure-git-webserver,5255,1304,6559,308.296703,False,0.0,gemini-2.5-pro,configure-git-webserver,308.296703,False,0.0,False,308.296703 +4ec37157-0f8b-459f-9961-d7312aa8a6c4,moonshotai/Kimi-K2-Instruct-0905,together_ai,log-summary-date-ranges,12620,3144,15764,166.977851,False,0.0,moonshotai/Kimi-K2-Instruct-0905,log-summary-date-ranges,166.977851,False,0.8,False,166.977851 +725182bf-d40c-4369-a573-d75b4e0e0005,moonshotai/Kimi-K2-Instruct-0905,together_ai,sqlite-with-gcov,14850,3510,18360,313.2702,False,0.0,moonshotai/Kimi-K2-Instruct-0905,sqlite-with-gcov,313.2702,False,0.4,False,313.2702 +60a0eaef-b10b-4181-a28c-2234d2979154,deepseek-ai/DeepSeek-V3.1,together_ai,tune-mjcf,11451,10477,21928,900.099051,False,0.0,deepseek-ai/DeepSeek-V3.1,tune-mjcf,900.099051,False,0.0,False,900.099051 +d3847054-5ee8-45d9-8739-d9c18f287e2e,claude-sonnet-4-20250514,anthropic,run-pdp11-code,9566,8551,18117,559.257241,False,0.0,claude-sonnet-4-20250514,run-pdp11-code,559.257241,False,0.0,False,559.257241 
+174614b7-18f5-49a4-930b-09a24b899f5f,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,path-tracing-reverse,9097,3068,12165,304.827997,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,path-tracing-reverse,304.827997,False,0.0,False,304.827997 +4470f1d3-f48f-4640-b5bc-a3a3d2ae4472,openai/gpt-oss-120b,together_ai,path-tracing-reverse,14712,16796,31508,1974.918343,False,0.0,openai/gpt-oss-120b,path-tracing-reverse,1974.918343,False,0.0,False,1974.918343 +ba279e82-1c1f-4a4f-bde4-8a32712c63d7,openai/gpt-oss-120b,together_ai,path-tracing,3054,2612,5666,327.615089,False,0.0,openai/gpt-oss-120b,path-tracing,327.615089,False,0.0,False,327.615089 +b0cd3510-5146-4a50-bafb-7da7c09654c5,moonshotai/Kimi-K2-Instruct-0905,together_ai,filter-js-from-html,3375,3510,6885,707.178394,False,0.0,moonshotai/Kimi-K2-Instruct-0905,filter-js-from-html,707.178394,False,0.0,False,707.178394 +817d7850-7fe1-4421-ab53-57b16da14659,gemini-2.5-pro,gemini,reverse-engineering,8085,6495,14580,898.736955,False,0.0,gemini-2.5-pro,reverse-engineering,898.736955,False,0.0,False,898.736955 +58f55fcb-1a6f-4e3e-b988-68bc4fbb8b54,gemini-2.5-pro,gemini,count-dataset-tokens,10416,2156,12572,910.470714,False,0.0,gemini-2.5-pro,count-dataset-tokens,910.470714,False,0.0,False,910.470714 +6fe5b1bf-fdf7-4e7b-bc91-671c8b2cdb4a,zai-org/GLM-4.5-Air-FP8,together_ai,write-compressor,11505,8395,19900,902.319958,False,0.0,zai-org/GLM-4.5-Air-FP8,write-compressor,902.319958,False,0.0,False,902.319958 +1e869927-ca46-4089-b477-ae0e1573a940,claude-sonnet-4-20250514,anthropic,build-cython-ext,13591,4392,17983,904.529451,False,0.0,claude-sonnet-4-20250514,build-cython-ext,904.529451,False,0.0,False,904.529451 +b7db7a19-6ff8-444b-adb0-43c7f555ac70,gemini-2.5-flash,gemini,password-recovery,1618,2552,4170,1325.439506,False,0.0,gemini-2.5-flash,password-recovery,1325.439506,False,0.0,False,1325.439506 
+3e1915da-6f56-4c1c-8599-75bc064649bb,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,crack-7z-hash,10287,3639,13926,315.384396,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,crack-7z-hash,315.384396,False,0.0,False,315.384396 +022aa524-d479-4a4d-b240-8b59085c88c0,moonshotai/Kimi-K2-Instruct-0905,together_ai,path-tracing,21108,20924,42032,1820.851112,False,0.0,moonshotai/Kimi-K2-Instruct-0905,path-tracing,1820.851112,False,0.0,False,1820.851112 +17675549-e130-45c0-a7ed-c3cfcc2add4f,grok-4-0709,xai,form-filling,3067,1665,4732,372.071094,False,0.0,grok-4-0709,form-filling,372.071094,False,0.2,False,372.071094 +8996f43c-62b5-4d28-87f6-d4bb845087cb,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sparql-university,1389,655,2044,41.159927,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sparql-university,41.159927,False,0.0,False,41.159927 +3f228cc5-63d7-4967-89ec-e7900164b9fa,gpt-5-nano,openai,pytorch-model-recovery,9435,11276,20711,903.244122,False,0.0,gpt-5-nano,pytorch-model-recovery,903.244122,False,0.0,False,903.244122 +9678e0fd-cdbd-4070-b1e4-caf6ea18e362,gemini-2.5-pro,gemini,video-processing,2776,2002,4778,498.938253,False,0.0,gemini-2.5-pro,video-processing,498.938253,False,0.0,False,498.938253 +4f9d41cd-5294-4170-9300-ebdae84af03a,zai-org/GLM-4.5-Air-FP8,together_ai,merge-diff-arc-agi-task,17977,7187,25164,221.573557,False,0.0,zai-org/GLM-4.5-Air-FP8,merge-diff-arc-agi-task,221.573557,False,0.0,False,221.573557 +1fc5b8b3-54fb-4b1a-b003-1fb04ad2826c,grok-code-fast-1,xai,gpt2-codegolf,1082,614,1696,69.75182,False,0.0,grok-code-fast-1,gpt2-codegolf,69.75182,False,0.0,False,69.75182 +9b849f08-0957-4233-9d7c-a4f3dca594e9,openai/gpt-oss-120b,together_ai,configure-git-webserver,5189,1322,6511,379.191672,True,1.0,openai/gpt-oss-120b,configure-git-webserver,379.191672,True,0.6,True,379.191672 
+ba67c269-687a-4dc4-9de7-906e447f9713,gpt-5,openai,fix-ocaml-gc,18795,14599,33394,3627.691823,False,0.0,gpt-5,fix-ocaml-gc,3627.691823,False,0.0,False,3627.691823 +c76eb7ec-e7bc-48ed-bec1-6905f5fea61d,claude-opus-4-1-20250805,anthropic,feal-linear-cryptanalysis,26681,29960,56641,1800.005004,False,0.0,claude-opus-4-1-20250805,feal-linear-cryptanalysis,1800.005004,False,0.0,False,1800.005004 +e05f3bd0-827f-471b-80fa-6933f5160061,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,circuit-fibsqrt,3347,3770,7117,455.85337,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,circuit-fibsqrt,455.85337,False,0.0,False,455.85337 +115fbaaf-0a48-4bbc-955d-c8243d8e1277,OpenAI/gpt-oss-20B,together_ai,run-pdp11-code,2807,10400,13207,1041.740275,False,0.0,OpenAI/gpt-oss-20B,run-pdp11-code,1041.740275,False,0.0,False,1041.740275 +99dc6c5d-2b02-4770-a04b-0b69eda27240,gpt-5,openai,regex-log,1499,721,2220,186.682062,True,1.0,gpt-5,regex-log,186.682062,True,1.0,True,186.682062 +e58e20bd-bf09-4fc1-b9a0-bba488b438f2,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,chess-best-move,10790,3278,14068,322.225343,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,chess-best-move,322.225343,False,0.0,False,322.225343 +c8b14e1d-3119-4e5d-93ca-39440cbfe117,OpenAI/gpt-oss-20B,together_ai,crack-7z-hash,882,223,1105,6.494683,False,0.0,OpenAI/gpt-oss-20B,crack-7z-hash,6.494683,False,0.0,False,6.494683 +82c0fa3f-e29d-4316-8519-2e2b3df4b562,claude-opus-4-1-20250805,anthropic,prove-plus-comm,2145,1429,3574,91.096263,True,1.0,claude-opus-4-1-20250805,prove-plus-comm,91.096263,True,1.0,True,91.096263 +fd6ad47b-0939-4d6a-bbea-35fdf880f3ac,grok-code-fast-1,xai,schemelike-metacircular-eval,4724,3717,8441,1060.356559,False,0.0,grok-code-fast-1,schemelike-metacircular-eval,1060.356559,False,0.0,False,1060.356559 
+54d1e8fc-3838-4bb7-a068-256012fe8d8e,claude-opus-4-1-20250805,anthropic,db-wal-recovery,6575,4389,10964,506.926065,False,0.0,claude-opus-4-1-20250805,db-wal-recovery,506.926065,False,0.0,False,506.926065 +67f6ab68-2c9f-43d1-83d5-a8a33ada9ad1,openai/gpt-oss-120b,together_ai,hf-model-inference,1817,1365,3182,81.434178,False,0.0,openai/gpt-oss-120b,hf-model-inference,81.434178,False,0.0,False,81.434178 +c77ddb80-11d1-4cb8-bd57-29e8714e12cb,openai/gpt-oss-120b,together_ai,qemu-startup,1215,1181,2396,140.478451,False,0.0,openai/gpt-oss-120b,qemu-startup,140.478451,False,0.0,False,140.478451 +fde69992-1800-47c4-9d93-91cf2c32cc66,gpt-5-nano,openai,merge-diff-arc-agi-task,10843,5760,16603,503.875515,False,0.0,gpt-5-nano,merge-diff-arc-agi-task,503.875515,False,0.2,False,503.875515 +45113b8f-5122-4a49-819d-f18ec0fd864c,deepseek-ai/DeepSeek-V3.1,together_ai,qemu-startup,1964,1964,3928,149.373774,False,0.0,deepseek-ai/DeepSeek-V3.1,qemu-startup,149.373774,False,0.2,False,149.373774 +e4da006e-8250-4cb3-b54c-42d38e2be7cd,OpenAI/gpt-oss-20B,together_ai,build-pmars,298,2308,2606,900.788083,False,0.0,OpenAI/gpt-oss-20B,build-pmars,900.788083,False,0.0,False,900.788083 +123b234a-2a31-473d-937b-dde198f48837,gpt-5-mini,openai,filter-js-from-html,4272,3418,7690,567.152518,False,0.0,gpt-5-mini,filter-js-from-html,567.152518,False,0.0,False,567.152518 +677bd8bc-ab5e-4a94-b354-58709e0c0e5e,grok-4-0709,xai,port-compressor,20972,37129,58101,3600.002399,False,0.0,grok-4-0709,port-compressor,3600.002399,False,0.0,False,3600.002399 +d9153ded-2d0e-4aee-9922-933e6d6a59df,grok-code-fast-1,xai,pytorch-model-recovery,4738,3326,8064,165.028589,True,1.0,grok-code-fast-1,pytorch-model-recovery,165.028589,True,0.8,True,165.028589 +cad02dd5-5fbb-4a25-81b3-d19768f5577f,gemini-2.5-pro,gemini,bn-fit-modify,26334,14043,40377,3181.10882,False,0.0,gemini-2.5-pro,bn-fit-modify,3181.10882,False,0.0,False,3181.10882 
+452415ac-4965-4f39-998d-57cbbcc24b55,gpt-5,openai,feal-differential-cryptanalysis,5437,4643,10080,460.952586,False,0.0,gpt-5,feal-differential-cryptanalysis,460.952586,False,0.0,False,460.952586 +5854f038-62dd-4075-ab0a-13f36ff088f4,claude-opus-4-1-20250805,anthropic,dna-assembly,20616,15367,35983,511.076769,False,0.0,claude-opus-4-1-20250805,dna-assembly,511.076769,False,0.0,False,511.076769 +8e9968cb-4a93-4f72-9e8c-a205db4744f0,gemini-2.5-pro,gemini,prove-plus-comm,1890,1753,3643,330.444313,True,1.0,gemini-2.5-pro,prove-plus-comm,330.444313,True,0.8,True,330.444313 +30bdcb90-bc1d-4a29-9096-19acace470b1,gpt-5-nano,openai,password-recovery,3582,4449,8031,1666.422786,False,0.0,gpt-5-nano,password-recovery,1666.422786,False,0.0,False,1666.422786 +9e91b193-0a4d-43b1-879c-101a4c003b74,gemini-2.5-flash,gemini,path-tracing,3133,15734,18867,604.98068,False,0.0,gemini-2.5-flash,path-tracing,604.98068,False,0.0,False,604.98068 +79960a0a-c5aa-4468-a339-d3845f498f43,deepseek-ai/DeepSeek-V3.1,together_ai,constraints-scheduling,5880,4281,10161,350.990819,True,1.0,deepseek-ai/DeepSeek-V3.1,constraints-scheduling,350.990819,True,0.8,True,350.990819 +4e5a2fd5-7d67-499f-a773-85e4588ef92e,grok-4-0709,xai,circuit-fibsqrt,3821,1243,5064,4113.21673,False,0.0,grok-4-0709,circuit-fibsqrt,4113.21673,False,0.0,False,4113.21673 +31b9b3bf-c77d-4ac8-a92f-e11fdd001ce3,openai/gpt-oss-120b,together_ai,sqlite-with-gcov,5112,1295,6407,408.31915,True,1.0,openai/gpt-oss-120b,sqlite-with-gcov,408.31915,True,0.8,True,408.31915 +80be214b-0f04-4ee2-9316-7635e4fa5b4b,gpt-5-nano,openai,openssl-selfsigned-cert,8738,10534,19272,904.478958,False,0.0,gpt-5-nano,openssl-selfsigned-cert,904.478958,False,0.6,False,904.478958 +e9cf0f4f-85fe-42ac-903a-6230bf4cc8ce,grok-code-fast-1,xai,make-doom-for-mips,15332,2744,18076,636.112899,False,0.0,grok-code-fast-1,make-doom-for-mips,636.112899,False,0.0,False,636.112899 
+e6572517-37bf-41b4-b946-125ef1b835fa,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,pytorch-model-recovery,14543,11696,26239,900.633301,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,pytorch-model-recovery,900.633301,True,0.8,True,900.633301 +673c7816-af07-49bf-ad7e-10c18faa8a22,gpt-5-nano,openai,fix-ocaml-gc,11027,11155,22182,3609.446217,False,0.0,gpt-5-nano,fix-ocaml-gc,3609.446217,False,0.0,False,3609.446217 +4c371ac3-14e4-44bb-8910-f84850c938da,OpenAI/gpt-oss-20B,together_ai,sanitize-git-repo,2154,840,2994,52.370822,False,0.0,OpenAI/gpt-oss-20B,sanitize-git-repo,52.370822,False,0.0,False,52.370822 +023e5e03-2195-4f15-8cfa-203b94caa5a0,openai/gpt-oss-120b,together_ai,chess-best-move,6494,6441,12935,416.918374,False,0.0,openai/gpt-oss-120b,chess-best-move,416.918374,False,0.0,False,416.918374 +03d03caf-4ee8-417b-a4bb-8517706b9f46,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,large-scale-text-editing,5392,3071,8463,418.408032,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,large-scale-text-editing,418.408032,False,0.0,False,418.408032 +927ad9a2-0bea-4e6a-9029-d5d987079509,gemini-2.5-flash,gemini,prove-plus-comm,5070,8819,13889,689.669266,True,1.0,gemini-2.5-flash,prove-plus-comm,689.669266,True,0.6,True,689.669266 +9b89f08b-6f11-4cd0-aa72-46d9326a3baa,gemini-2.5-pro,gemini,form-filling,10218,9743,19961,461.405179,False,0.0,gemini-2.5-pro,form-filling,461.405179,False,0.2,False,461.405179 +09eb55ed-67d8-4a4b-bc05-8d0ab7932fdd,gemini-2.5-flash,gemini,largest-eigenval,3600,2324,5924,927.189793,False,0.0,gemini-2.5-flash,largest-eigenval,927.189793,False,0.0,False,927.189793 +65fe6f82-b3f0-449f-82da-6f921c417aac,gpt-5-nano,openai,make-mips-interpreter,34433,28683,63116,1805.38438,False,0.0,gpt-5-nano,make-mips-interpreter,1805.38438,False,0.0,False,1805.38438 
+a8978a4e-9d89-4216-a5dd-1797f34e28e0,claude-opus-4-1-20250805,anthropic,password-recovery,8002,6813,14815,321.28878,True,1.0,claude-opus-4-1-20250805,password-recovery,321.28878,True,0.5555555555555556,True,321.28878 +47c2bdfe-3e1f-48c2-af26-3dcf61216345,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,mteb-leaderboard,10084,3100,13184,255.135219,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,mteb-leaderboard,255.135219,False,0.0,False,255.135219 +5fcef6f5-c931-40e1-bb3a-c1fff033da31,gpt-5,openai,crack-7z-hash,2860,1580,4440,140.127986,False,0.0,gpt-5,crack-7z-hash,140.127986,False,0.4285714285714285,False,140.127986 +2b8be2b8-79df-47d3-a1b5-785db0a385a4,grok-code-fast-1,xai,video-processing,1596,831,2427,52.054254,False,0.0,grok-code-fast-1,video-processing,52.054254,False,0.0,False,52.054254 +45f5468c-e184-4704-8a82-118e3cf6c0d1,OpenAI/gpt-oss-20B,together_ai,hf-model-inference,2634,2121,4755,129.096941,False,0.0,OpenAI/gpt-oss-20B,hf-model-inference,129.096941,False,0.4,False,129.096941 +e099d492-f6ab-4df8-9335-3911ab79927c,claude-sonnet-4-20250514,anthropic,configure-git-webserver,7898,2911,10809,741.377653,True,1.0,claude-sonnet-4-20250514,configure-git-webserver,741.377653,True,0.6,True,741.377653 +bb68e8e4-4743-44f6-8942-6991e1ff517c,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,reverse-engineering,4449,8809,13258,1801.072754,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,reverse-engineering,1801.072754,False,0.0,False,1801.072754 +2cf7f8b8-3f04-4ddc-9928-1526e9691f0b,moonshotai/Kimi-K2-Instruct-0905,together_ai,fix-ocaml-gc,54326,29686,84012,3602.065217,False,0.0,moonshotai/Kimi-K2-Instruct-0905,fix-ocaml-gc,3602.065217,False,0.0,False,3602.065217 +687c7370-6aef-4fef-90f1-94d1dda3e35e,gpt-5,openai,adaptive-rejection-sampler,2163,10241,12404,947.259483,False,0.0,gpt-5,adaptive-rejection-sampler,947.259483,False,0.4,False,947.259483 
+133cf151-a73c-4e37-b206-1a1ebef24c8a,gpt-5-nano,openai,regex-log,6125,8257,14382,764.706026,False,0.0,gpt-5-nano,regex-log,764.706026,False,0.2,False,764.706026 +8bb9a620-8e27-44eb-8d55-5dd9ad106f92,claude-opus-4-1-20250805,anthropic,filter-js-from-html,8325,8100,16425,214.033549,False,0.0,claude-opus-4-1-20250805,filter-js-from-html,214.033549,False,0.0,False,214.033549 +b5d051e6-2e82-45ab-8b36-3cec87526505,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,reshard-c4-data,13635,14564,28199,900.415971,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,reshard-c4-data,900.415971,False,0.0,False,900.415971 +57c2f529-8569-4f7c-a775-20eb7625dbba,claude-opus-4-1-20250805,anthropic,polyglot-c-py,7753,5923,13676,206.43158,False,0.0,claude-opus-4-1-20250805,polyglot-c-py,206.43158,False,0.0,False,206.43158 +c7e7cf38-c6d3-4748-89cd-e6ad56e3c377,grok-4-0709,xai,model-extraction-relu-logits,1349,857,2206,925.749087,False,0.0,grok-4-0709,model-extraction-relu-logits,925.749087,False,0.0,False,925.749087 +8c1ffa77-d7a4-4fd5-911f-c02f395e16cc,gemini-2.5-flash,gemini,train-fasttext,20164,4647,24811,1105.799926,False,0.0,gemini-2.5-flash,train-fasttext,1105.799926,False,0.0,False,1105.799926 +286557fb-b1c1-44b2-abec-1bdf121651e0,gpt-5,openai,code-from-image,16788,19786,36574,1200.001344,False,0.0,gpt-5,code-from-image,1200.001344,False,0.4,False,1200.001344 +67f5577d-b536-4e8c-be75-7247fe54d22f,deepseek-ai/DeepSeek-V3.1,together_ai,merge-diff-arc-agi-task,10289,3898,14187,915.268858,False,0.0,deepseek-ai/DeepSeek-V3.1,merge-diff-arc-agi-task,915.268858,False,0.2,False,915.268858 +40a54beb-c1e6-4b7d-9905-9a70233b278c,claude-sonnet-4-20250514,anthropic,regex-log,4249,4292,8541,394.074606,True,1.0,claude-sonnet-4-20250514,regex-log,394.074606,True,0.8,True,394.074606 +012737aa-b210-4094-b666-af6d6677686b,OpenAI/gpt-oss-20B,together_ai,tune-mjcf,2537,11329,13866,900.050309,False,0.0,OpenAI/gpt-oss-20B,tune-mjcf,900.050309,False,0.0,False,900.050309 
+8d7e07a1-69e4-4677-9beb-78756f10a8cf,gpt-5,openai,reverse-engineering,6670,7308,13978,1824.395143,False,0.0,gpt-5,reverse-engineering,1824.395143,False,0.6666666666666666,False,1824.395143 +ddd65d26-9828-4fb6-8842-5544683a07b4,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,winning-avg-corewars,16969,17121,34090,2644.987331,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,winning-avg-corewars,2644.987331,False,0.0,False,2644.987331 +ed2e77eb-5a57-4158-b278-dd2a70896713,gemini-2.5-flash,gemini,fix-code-vulnerability,9285,4540,13825,904.470365,False,0.0,gemini-2.5-flash,fix-code-vulnerability,904.470365,False,0.0,False,904.470365 +4d1ffb2d-ad00-48a6-869f-6f6418fa217f,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-pmars,13118,6251,19369,915.933456,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-pmars,915.933456,True,1.0,True,915.933456 +85e219a4-6110-44df-a2e3-26e6a853efe8,zai-org/GLM-4.5-Air-FP8,together_ai,install-windows-3.11,7424,3028,10452,757.110773,False,0.0,zai-org/GLM-4.5-Air-FP8,install-windows-3.11,757.110773,False,0.0,False,757.110773 +a8df9ae6-5894-4908-ae10-20cf096a68ed,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,reshard-c4-data,7486,3917,11403,378.618312,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,reshard-c4-data,378.618312,False,0.0,False,378.618312 +268318a5-a2ca-4f64-b5e3-33554cbd0807,gemini-2.5-pro,gemini,sanitize-git-repo,12957,1736,14693,264.145468,False,0.0,gemini-2.5-pro,sanitize-git-repo,264.145468,False,0.0,False,264.145468 +4da9c447-3511-419c-993d-fef9a35dd0cd,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,merge-diff-arc-agi-task,8444,3187,11631,168.27478,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,merge-diff-arc-agi-task,168.27478,False,0.0,False,168.27478 
+8105feba-7a00-46f8-84fa-bc7d9428e84e,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,mteb-leaderboard,5460,1500,6960,214.026758,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,mteb-leaderboard,214.026758,False,0.0,False,214.026758 +8aa6f73e-cd5f-4a4e-9803-79b853d93acd,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,install-klee-minimal,13261,2255,15516,1751.069716,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,install-klee-minimal,1751.069716,False,0.0,False,1751.069716 +c4d6605e-a3ad-4d4e-b910-87b7e4a27052,gemini-2.5-flash,gemini,chess-best-move,4698,7469,12167,627.610071,False,0.0,gemini-2.5-flash,chess-best-move,627.610071,False,0.0,False,627.610071 +ba4093ff-7655-40e2-9944-624782ad7916,claude-sonnet-4-20250514,anthropic,build-cython-ext,14999,5657,20656,649.676938,False,0.0,claude-sonnet-4-20250514,build-cython-ext,649.676938,False,0.0,False,649.676938 +7230fdbc-86d7-469d-9b95-079236efd67b,zai-org/GLM-4.5-Air-FP8,together_ai,dna-insert,18840,7149,25989,419.1406,False,0.0,zai-org/GLM-4.5-Air-FP8,dna-insert,419.1406,False,0.0,False,419.1406 +3e75109c-dca6-48d8-811a-5c11cd582bfc,OpenAI/gpt-oss-20B,together_ai,break-filter-js-from-html,330,1323,1653,91.586926,False,0.0,OpenAI/gpt-oss-20B,break-filter-js-from-html,91.586926,False,0.0,False,91.586926 +7a1a3b6f-8ba9-48ce-8d62-b3efa7fdd92b,deepseek-ai/DeepSeek-V3.1,together_ai,merge-diff-arc-agi-task,18255,7006,25261,235.582091,True,1.0,deepseek-ai/DeepSeek-V3.1,merge-diff-arc-agi-task,235.582091,True,0.2,True,235.582091 +e722ba2f-8654-4ae3-804b-678cd2824d2a,OpenAI/gpt-oss-20B,together_ai,build-cython-ext,5033,22575,27608,900.344872,False,0.0,OpenAI/gpt-oss-20B,build-cython-ext,900.344872,False,0.0,False,900.344872 +c7f44e5c-d19b-45c7-8435-5ef25aeb84c1,openai/gpt-oss-120b,together_ai,large-scale-text-editing,6452,7988,14440,1243.511917,False,0.0,openai/gpt-oss-120b,large-scale-text-editing,1243.511917,False,0.0,False,1243.511917 
+be1fcab7-d515-41e5-a3cf-f5fd422fd565,openai/gpt-oss-120b,together_ai,reverse-engineering,12355,9462,21817,923.221569,True,1.0,openai/gpt-oss-120b,reverse-engineering,923.221569,True,0.2,True,923.221569 +4cfcb1c8-ecc2-4140-a97a-39357b396022,gemini-2.5-pro,gemini,feal-differential-cryptanalysis,6436,6153,12589,1157.066908,True,1.0,gemini-2.5-pro,feal-differential-cryptanalysis,1157.066908,True,0.6,True,1157.066908 +b0e2f43f-19d6-4412-8a61-da781c456e4d,gemini-2.5-flash,gemini,adaptive-rejection-sampler,17375,9809,27184,906.827773,False,0.0,gemini-2.5-flash,adaptive-rejection-sampler,906.827773,False,0.0,False,906.827773 +f649f426-bf84-41c8-a076-130782763dfc,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,financial-document-processor,2745,1141,3886,86.600112,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,financial-document-processor,86.600112,False,0.0,False,86.600112 +4fb4b340-ef1f-4cf7-bdab-e81ae765a07f,grok-code-fast-1,xai,video-processing,2194,1532,3726,152.243322,False,0.0,grok-code-fast-1,video-processing,152.243322,False,0.0,False,152.243322 +43b89775-8f8b-473b-9225-0f8d42d1c4df,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,install-klee-minimal,17687,3436,21123,803.787656,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,install-klee-minimal,803.787656,False,0.0,False,803.787656 +57303bba-1dfd-4066-9e6c-fddc15cebf31,gpt-5-mini,openai,sqlite-with-gcov,5903,2017,7920,299.261982,True,1.0,gpt-5-mini,sqlite-with-gcov,299.261982,True,1.0,True,299.261982 +66874905-467a-4e9d-b645-bc7fdb1f7bde,grok-4-0709,xai,hf-model-inference,3694,1432,5126,291.083538,True,1.0,grok-4-0709,hf-model-inference,291.083538,True,1.0,True,291.083538 +4de074b7-1534-4b27-b38f-53ca493e3634,gemini-2.5-pro,gemini,run-pdp11-code,10357,5523,15880,1000.576743,False,0.0,gemini-2.5-pro,run-pdp11-code,1000.576743,False,0.0,False,1000.576743 
+e12bf8e9-f9f7-409e-87ff-8f5279ce8c8e,claude-opus-4-1-20250805,anthropic,merge-diff-arc-agi-task,11671,4797,16468,217.071652,True,1.0,claude-opus-4-1-20250805,merge-diff-arc-agi-task,217.071652,True,0.3333333333333333,True,217.071652 +bdd04e74-d3e7-461d-87bf-1eb0b099edaf,deepseek-ai/DeepSeek-V3.1,together_ai,model-extraction-relu-logits,5128,3792,8920,197.996922,True,1.0,deepseek-ai/DeepSeek-V3.1,model-extraction-relu-logits,197.996922,True,0.2,True,197.996922 +c1f8bae4-037c-4021-86b7-e7be4ef15c1c,deepseek-ai/DeepSeek-V3.1,together_ai,pytorch-model-cli,3764,4678,8442,755.537638,False,0.0,deepseek-ai/DeepSeek-V3.1,pytorch-model-cli,755.537638,False,0.0,False,755.537638 +5d24890c-e8c7-4b64-bf3e-5d645f7280ec,grok-4-0709,xai,port-compressor,16874,27499,44373,3605.33934,False,0.0,grok-4-0709,port-compressor,3605.33934,False,0.0,False,3605.33934 +9d0b3277-b385-4924-8e40-bc9cb12e5ede,gpt-5-nano,openai,write-compressor,9085,7282,16367,907.399624,False,0.0,gpt-5-nano,write-compressor,907.399624,False,0.0,False,907.399624 +3e744871-e3a7-42ae-8c36-e15d6218105a,OpenAI/gpt-oss-20B,together_ai,merge-diff-arc-agi-task,771,1647,2418,60.228993,False,0.0,OpenAI/gpt-oss-20B,merge-diff-arc-agi-task,60.228993,False,0.0,False,60.228993 +3bed7855-83c6-4c4d-9a9d-1014281a242b,zai-org/GLM-4.5-Air-FP8,together_ai,mteb-retrieve,1681,3486,5167,486.003296,False,0.0,zai-org/GLM-4.5-Air-FP8,mteb-retrieve,486.003296,False,0.0,False,486.003296 +61c109e3-c374-4ca8-b6a2-8aa3fdb52db8,zai-org/GLM-4.5-Air-FP8,together_ai,run-pdp11-code,8609,10156,18765,1001.108505,False,0.0,zai-org/GLM-4.5-Air-FP8,run-pdp11-code,1001.108505,False,0.0,False,1001.108505 +d6b4176b-6a74-4ad7-9760-c05bb64a5445,grok-4-0709,xai,financial-document-processor,1780,2202,3982,1225.359464,False,0.0,grok-4-0709,financial-document-processor,1225.359464,False,0.0,False,1225.359464 
+fd2746ac-ebda-4090-b6f8-158ff3e5712a,gemini-2.5-pro,gemini,sqlite-db-truncate,4062,2542,6604,498.972732,False,0.0,gemini-2.5-pro,sqlite-db-truncate,498.972732,False,0.0,False,498.972732 +fa493922-de8b-413e-a8d0-ea4719ae7a60,openai/gpt-oss-120b,together_ai,build-pov-ray,34952,24929,59881,4434.340658,False,0.0,openai/gpt-oss-120b,build-pov-ray,4434.340658,False,0.0,False,4434.340658 +42d5e0be-1278-4a47-a329-7f155a2dcb62,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,code-from-image,4946,799,5745,47.011482,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,code-from-image,47.011482,True,0.4,True,47.011482 +242f6209-f7ec-4701-b499-f2de0cea1931,gemini-2.5-pro,gemini,winning-avg-corewars,15661,18058,33719,3602.992949,False,0.0,gemini-2.5-pro,winning-avg-corewars,3602.992949,False,0.0,False,3602.992949 +afdfcef2-8fee-4281-b3b3-a837923aa32b,gpt-5,openai,sparql-university,5731,2395,8126,354.514843,True,1.0,gpt-5,sparql-university,354.514843,True,0.8,True,354.514843 +0b1249b7-84df-4604-95c0-94a8ac7f2cad,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,feal-linear-cryptanalysis,17521,16076,33597,1120.093766,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,feal-linear-cryptanalysis,1120.093766,False,0.0,False,1120.093766 +08d6e1c2-f9d3-4165-bddd-d720993958ea,openai/gpt-oss-120b,together_ai,filter-js-from-html,1424,773,2197,59.085328,False,0.0,openai/gpt-oss-120b,filter-js-from-html,59.085328,False,0.0,False,59.085328 +11e2bc41-acf9-47c3-9e9b-ec758c61c529,OpenAI/gpt-oss-20B,together_ai,pytorch-model-cli,1093,2015,3108,89.057138,False,0.0,OpenAI/gpt-oss-20B,pytorch-model-cli,89.057138,False,0.0,False,89.057138 +4b11afde-c593-4d2c-83df-d12f1b8008c1,claude-sonnet-4-20250514,anthropic,mteb-leaderboard,16092,6189,22281,681.757995,False,0.0,claude-sonnet-4-20250514,mteb-leaderboard,681.757995,False,0.0,False,681.757995 
+e94f9f0c-e177-43cc-8b77-8abd50be1b02,moonshotai/Kimi-K2-Instruct-0905,together_ai,cancel-async-tasks,2741,2122,4863,405.314407,False,0.0,moonshotai/Kimi-K2-Instruct-0905,cancel-async-tasks,405.314407,False,0.6,False,405.314407 +760e7d17-6e86-4ecb-8b61-2997998a78d3,zai-org/GLM-4.5-Air-FP8,together_ai,install-klee-minimal,9639,2110,11749,908.220079,False,0.0,zai-org/GLM-4.5-Air-FP8,install-klee-minimal,908.220079,False,0.0,False,908.220079 +e51def54-c337-488b-ab93-403a9ac03bbd,openai/gpt-oss-120b,together_ai,sanitize-git-repo,4135,1022,5157,148.139276,False,0.0,openai/gpt-oss-120b,sanitize-git-repo,148.139276,False,0.0,False,148.139276 +ea916cad-d7d6-4e4c-9c65-695480f82964,gpt-5,openai,extract-elf,2594,3156,5750,216.97055,False,0.0,gpt-5,extract-elf,216.97055,False,0.2857142857142857,False,216.97055 +a7273f7a-24a8-4067-9630-9aaa3e3afeff,openai/gpt-oss-120b,together_ai,constraints-scheduling,4397,2695,7092,104.04398,True,1.0,openai/gpt-oss-120b,constraints-scheduling,104.04398,True,1.0,True,104.04398 +68680041-9cba-41e2-9c3f-dd96b88b2d5f,gpt-5-nano,openai,feal-differential-cryptanalysis,23865,27562,51427,1803.213401,False,0.0,gpt-5-nano,feal-differential-cryptanalysis,1803.213401,False,0.0,False,1803.213401 +c9c0b55a-49f2-46a4-8b94-ca8679010cac,gpt-5-mini,openai,circuit-fibsqrt,33391,40604,73995,3617.064916,False,0.0,gpt-5-mini,circuit-fibsqrt,3617.064916,False,0.0,False,3617.064916 +3a989814-8093-43c9-a91e-e6e657d3987e,claude-sonnet-4-20250514,anthropic,mteb-leaderboard,960,594,1554,20.98843,False,0.0,claude-sonnet-4-20250514,mteb-leaderboard,20.98843,False,0.0,False,20.98843 +4b09af71-aea2-4f2e-af72-ba09df9983d2,claude-opus-4-1-20250805,anthropic,build-initramfs-qemu,13557,5710,19267,266.960812,False,0.0,claude-opus-4-1-20250805,build-initramfs-qemu,266.960812,False,0.0,False,266.960812 
+30ccf8f0-c600-42fd-9a20-bea5aa38dd30,gpt-5-nano,openai,build-initramfs-qemu,2554,5929,8483,914.449687,False,0.0,gpt-5-nano,build-initramfs-qemu,914.449687,False,0.0,False,914.449687 +6086d3d1-d440-417d-bcb1-c9ef62fa0140,OpenAI/gpt-oss-20B,together_ai,reverse-engineering,4499,28136,32635,1801.983972,False,0.0,OpenAI/gpt-oss-20B,reverse-engineering,1801.983972,False,0.0,False,1801.983972 +0e9c10ae-cd82-4afc-b329-c70d9552ec0d,claude-opus-4-1-20250805,anthropic,constraints-scheduling,5782,3624,9406,335.54073,True,1.0,claude-opus-4-1-20250805,constraints-scheduling,335.54073,True,0.8888888888888888,True,335.54073 +d412527e-84c7-460b-8524-d501c01f142b,gpt-5-nano,openai,adaptive-rejection-sampler,11742,20605,32347,902.897538,False,0.0,gpt-5-nano,adaptive-rejection-sampler,902.897538,False,0.2,False,902.897538 +89ff8175-d909-484a-9228-d523a6cd6335,openai/gpt-oss-120b,together_ai,fix-git,2527,1299,3826,261.036047,False,0.0,openai/gpt-oss-120b,fix-git,261.036047,False,0.6,False,261.036047 +2494010e-6cf2-4388-87b8-5a164f6fa909,grok-code-fast-1,xai,port-compressor,35250,15471,50721,3600.001048,False,0.0,grok-code-fast-1,port-compressor,3600.001048,False,0.0,False,3600.001048 +a141156f-5a4b-46e9-b721-5623069e0a11,gpt-5-mini,openai,pytorch-model-recovery,3727,5808,9535,297.503929,False,0.0,gpt-5-mini,pytorch-model-recovery,297.503929,False,0.0,False,297.503929 +3362673f-f8a4-4b81-aacd-c073df21690d,openai/gpt-oss-120b,together_ai,break-filter-js-from-html,2467,3726,6193,355.495715,False,0.0,openai/gpt-oss-120b,break-filter-js-from-html,355.495715,False,0.0,False,355.495715 +e7a54e35-e1c6-4406-9a95-252b8c60f21b,gemini-2.5-flash,gemini,feal-linear-cryptanalysis,8446,22877,31323,408.574574,False,0.0,gemini-2.5-flash,feal-linear-cryptanalysis,408.574574,False,0.0,False,408.574574 +30b5565a-1a21-4fdf-b65a-68bfe7e2b7e8,gpt-5-mini,openai,sqlite-db-truncate,6433,4322,10755,473.371433,False,0.0,gpt-5-mini,sqlite-db-truncate,473.371433,False,0.0,False,473.371433 
+f4a58f67-209f-491e-9390-6e8faaed0192,gpt-5,openai,path-tracing,34819,32157,66976,6611.720919,False,0.0,gpt-5,path-tracing,6611.720919,False,0.0,False,6611.720919 +6c0e03f8-62d1-41b9-974f-01cf02b5784e,grok-4-0709,xai,feal-differential-cryptanalysis,2528,2708,5236,811.234777,True,1.0,grok-4-0709,feal-differential-cryptanalysis,811.234777,True,0.8,True,811.234777 +fa8cec37-d931-4136-ad63-0403853da8ae,OpenAI/gpt-oss-20B,together_ai,reshard-c4-data,1996,1902,3898,122.426137,False,0.0,OpenAI/gpt-oss-20B,reshard-c4-data,122.426137,False,0.0,False,122.426137 +dcf0bfc4-fcd7-43f0-933d-6ec7de023f13,gpt-5-nano,openai,write-compressor,18109,10399,28508,903.472232,False,0.0,gpt-5-nano,write-compressor,903.472232,False,0.0,False,903.472232 +6cba3f53-e365-4a02-90fb-79517d752af0,grok-code-fast-1,xai,fix-ocaml-gc,18814,6043,24857,1485.734256,False,0.0,grok-code-fast-1,fix-ocaml-gc,1485.734256,False,0.0,False,1485.734256 +1cd09a7e-a926-42d3-872b-7ee45441cd78,deepseek-ai/DeepSeek-V3.1,together_ai,sqlite-db-truncate,5538,4428,9966,290.578305,False,0.0,deepseek-ai/DeepSeek-V3.1,sqlite-db-truncate,290.578305,False,0.0,False,290.578305 +da970409-acf6-4732-9876-2e7b5b18c88a,grok-code-fast-1,xai,build-pmars,11561,3184,14745,482.589914,True,1.0,grok-code-fast-1,build-pmars,482.589914,True,0.8,True,482.589914 +a34b2203-8a62-47ca-8d25-28da78aed828,gpt-5-mini,openai,adaptive-rejection-sampler,6815,18711,25526,900.006354,True,1.0,gpt-5-mini,adaptive-rejection-sampler,900.006354,True,0.4,True,900.006354 +a6589e35-a4b3-4b7c-a093-d3757a8b52f2,grok-4-0709,xai,mteb-leaderboard,927,393,1320,330.339313,False,0.0,grok-4-0709,mteb-leaderboard,330.339313,False,0.0,False,330.339313 +80a8b87c-8828-45a0-b7a4-84c875a8d38c,deepseek-ai/DeepSeek-V3.1,together_ai,port-compressor,66729,43976,110705,3606.337451,False,0.0,deepseek-ai/DeepSeek-V3.1,port-compressor,3606.337451,False,0.0,False,3606.337451 
+08a2960c-f3db-4aca-a129-0affc8c1a792,gemini-2.5-pro,gemini,sparql-university,5502,1868,7370,1011.935806,True,1.0,gemini-2.5-pro,sparql-university,1011.935806,True,0.6,True,1011.935806 +a6758dfd-81fb-4284-9ffa-61ba5dbe32e4,zai-org/GLM-4.5-Air-FP8,together_ai,distribution-search,11568,11977,23545,877.421695,False,0.0,zai-org/GLM-4.5-Air-FP8,distribution-search,877.421695,False,0.0,False,877.421695 +6c28df03-b3fe-41cc-9a5d-86278cb896f2,zai-org/GLM-4.5-Air-FP8,together_ai,install-klee-minimal,7530,2865,10395,913.315869,False,0.0,zai-org/GLM-4.5-Air-FP8,install-klee-minimal,913.315869,False,0.0,False,913.315869 +01d0bbdd-6daa-4b1d-9b79-544240346808,gemini-2.5-pro,gemini,pypi-server,8099,3129,11228,630.920116,True,1.0,gemini-2.5-pro,pypi-server,630.920116,True,0.8,True,630.920116 +be62c2d2-27b9-4312-a6e5-92de5f442a40,gpt-5-mini,openai,db-wal-recovery,7433,14925,22358,901.020909,False,0.0,gpt-5-mini,db-wal-recovery,901.020909,False,0.0,False,901.020909 +6cdfd015-430d-4038-a4d0-a40c82d16fd2,claude-sonnet-4-20250514,anthropic,configure-git-webserver,7371,2613,9984,513.829686,False,0.0,claude-sonnet-4-20250514,configure-git-webserver,513.829686,False,0.6,False,513.829686 +d3482749-e71e-4ef4-bf2d-31898f7ce488,zai-org/GLM-4.5-Air-FP8,together_ai,train-fasttext,84134,19730,103864,3600.002575,False,0.0,zai-org/GLM-4.5-Air-FP8,train-fasttext,3600.002575,False,0.2,False,3600.002575 +5140980b-cefa-44e9-9629-efd7676146e4,OpenAI/gpt-oss-20B,together_ai,path-tracing-reverse,871,1341,2212,89.028523,False,0.0,OpenAI/gpt-oss-20B,path-tracing-reverse,89.028523,False,0.0,False,89.028523 +96fcd209-7c8e-4aeb-bf4f-e338ed706b7e,gpt-5-nano,openai,qemu-startup,22921,4769,27690,900.068942,False,0.0,gpt-5-nano,qemu-startup,900.068942,False,0.0,False,900.068942 
+306f1740-3fca-41cc-a41c-61a286cbdbbd,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,path-tracing-reverse,27171,12393,39564,1824.024906,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,path-tracing-reverse,1824.024906,False,0.0,False,1824.024906 +fe83ebc1-3ff7-4def-82dd-e60808bb20a7,deepseek-ai/DeepSeek-V3.1,together_ai,sqlite-db-truncate,6189,4747,10936,900.063573,False,0.0,deepseek-ai/DeepSeek-V3.1,sqlite-db-truncate,900.063573,False,0.0,False,900.063573 +7e5a95f3-f02b-4dc6-a83b-9409f7ed21c3,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,feal-differential-cryptanalysis,25148,31859,57007,1348.891886,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,feal-differential-cryptanalysis,1348.891886,False,0.0,False,1348.891886 +3460bc75-a208-4ce6-a53e-ced1a201f24c,deepseek-ai/DeepSeek-V3.1,together_ai,configure-git-webserver,5824,1573,7397,237.602154,True,1.0,deepseek-ai/DeepSeek-V3.1,configure-git-webserver,237.602154,True,1.0,True,237.602154 +9233f01e-96b1-475e-bdc5-99459abc838a,claude-sonnet-4-20250514,anthropic,adaptive-rejection-sampler,14445,11157,25602,913.14035,False,0.0,claude-sonnet-4-20250514,adaptive-rejection-sampler,913.14035,False,0.0,False,913.14035 +ece7e9bc-7f65-4019-8991-e8c7a22a0796,gpt-5,openai,model-extraction-relu-logits,3375,2609,5984,96.777411,False,0.0,gpt-5,model-extraction-relu-logits,96.777411,False,0.1666666666666666,False,96.777411 +11293f0f-1997-498c-b84a-af00a7eb8ab5,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,count-dataset-tokens,14520,5132,19652,740.905576,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,count-dataset-tokens,740.905576,False,0.0,False,740.905576 +8452678e-763f-4333-afff-48fe64f6082d,grok-code-fast-1,xai,break-filter-js-from-html,1924,1398,3322,299.814663,False,0.0,grok-code-fast-1,break-filter-js-from-html,299.814663,False,0.0,False,299.814663 
+1a58bf97-4d56-4c0b-8576-585d0a72d078,moonshotai/Kimi-K2-Instruct-0905,together_ai,crack-7z-hash,9490,3990,13480,312.902691,True,1.0,moonshotai/Kimi-K2-Instruct-0905,crack-7z-hash,312.902691,True,1.0,True,312.902691 +b8413636-42b0-4b7e-9f02-006bf9813646,gpt-5,openai,write-compressor,9136,9331,18467,817.941795,True,1.0,gpt-5,write-compressor,817.941795,True,0.3333333333333333,True,817.941795 +cd7e45fd-cb30-4f4c-a2fd-819027102a24,deepseek-ai/DeepSeek-V3.1,together_ai,adaptive-rejection-sampler,9571,9871,19442,921.045348,False,0.0,deepseek-ai/DeepSeek-V3.1,adaptive-rejection-sampler,921.045348,False,0.2,False,921.045348 +7a594bb1-d629-4dfb-988a-5438205bb1b1,gpt-5-nano,openai,pytorch-model-cli,10328,4536,14864,237.045804,False,0.0,gpt-5-nano,pytorch-model-cli,237.045804,False,0.0,False,237.045804 +9e97df51-00bf-4537-a05b-52e81406872f,openai/gpt-oss-120b,together_ai,hf-model-inference,2432,1491,3923,432.93709,False,0.0,openai/gpt-oss-120b,hf-model-inference,432.93709,False,0.0,False,432.93709 +15d9a81e-836e-49a9-ad13-08b3474f03be,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,configure-git-webserver,5006,1132,6138,249.225807,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,configure-git-webserver,249.225807,True,0.6,True,249.225807 +ba2b9534-3641-4305-b940-d2ac1e7b3bd7,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,install-windows-3.11,8398,3555,11953,237.833925,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,install-windows-3.11,237.833925,False,0.0,False,237.833925 +f606f3a7-6266-4c9b-a396-2342709cf3dd,gemini-2.5-flash,gemini,qemu-alpine-ssh,2973,6331,9304,902.515037,False,0.0,gemini-2.5-flash,qemu-alpine-ssh,902.515037,False,0.0,False,902.515037 +72b2b9e6-09af-4650-93bc-9971a8660491,OpenAI/gpt-oss-20B,together_ai,count-dataset-tokens,1033,1641,2674,250.126521,False,0.0,OpenAI/gpt-oss-20B,count-dataset-tokens,250.126521,False,0.0,False,250.126521 
+a628dc9f-e642-4e48-a358-03e66c2a5d9f,gpt-5-mini,openai,make-mips-interpreter,7460,10585,18045,1808.065558,False,0.0,gpt-5-mini,make-mips-interpreter,1808.065558,False,0.0,False,1808.065558 +c38caa6f-3413-41de-a0cc-32b74ba3df61,gpt-5-nano,openai,openssl-selfsigned-cert,7148,7456,14604,631.43602,True,1.0,gpt-5-nano,openssl-selfsigned-cert,631.43602,True,0.6,True,631.43602 +8cc8d520-557a-4e13-89c2-fd21ada68f2b,claude-sonnet-4-20250514,anthropic,sparql-university,12088,7689,19777,663.421862,False,0.0,claude-sonnet-4-20250514,sparql-university,663.421862,False,0.0,False,663.421862 +7eb30c3d-3cca-4767-8f0c-3b5178e84dda,gpt-5-mini,openai,merge-diff-arc-agi-task,4420,4809,9229,247.340679,True,1.0,gpt-5-mini,merge-diff-arc-agi-task,247.340679,True,0.4,True,247.340679 +61c6711c-c079-4f82-8c38-a34fb167d390,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sparql-university,8085,4306,12391,242.737937,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sparql-university,242.737937,False,0.0,False,242.737937 +2074395e-72ba-495c-aac3-52cb348aaefb,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,mteb-leaderboard,19533,2989,22522,296.550172,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,mteb-leaderboard,296.550172,False,0.0,False,296.550172 +0755df59-ef1d-41bb-a1fb-d251cf47523e,claude-opus-4-1-20250805,anthropic,fix-code-vulnerability,12413,5276,17689,295.388928,False,0.0,claude-opus-4-1-20250805,fix-code-vulnerability,295.388928,False,0.125,False,295.388928 +88f73130-4828-4fdf-9c42-75e7d1c2f818,moonshotai/Kimi-K2-Instruct-0905,together_ai,financial-document-processor,18464,10367,28831,1204.663633,False,0.0,moonshotai/Kimi-K2-Instruct-0905,financial-document-processor,1204.663633,False,0.0,False,1204.663633 +744de146-7724-4b53-acea-752d69c10461,grok-4-0709,xai,sqlite-with-gcov,8898,1803,10701,491.128847,False,0.0,grok-4-0709,sqlite-with-gcov,491.128847,False,0.0,False,491.128847 
+180ef646-0896-48be-96db-f96a58ff4dcb,zai-org/GLM-4.5-Air-FP8,together_ai,build-initramfs-qemu,7233,7723,14956,909.26996,False,0.0,zai-org/GLM-4.5-Air-FP8,build-initramfs-qemu,909.26996,False,0.0,False,909.26996 +3c351a24-993d-4606-b41b-428d27d3c4ae,claude-sonnet-4-20250514,anthropic,install-windows-3.11,10018,4679,14697,446.727689,False,0.0,claude-sonnet-4-20250514,install-windows-3.11,446.727689,False,0.0,False,446.727689 +fec93a22-3d7f-4957-af2d-7ff66628cd40,grok-4-0709,xai,polyglot-rust-c,1351,1118,2469,746.174398,False,0.0,grok-4-0709,polyglot-rust-c,746.174398,False,0.0,False,746.174398 +b0173bb2-013c-4542-b3ee-9fc316f66109,deepseek-ai/DeepSeek-V3.1,together_ai,extract-elf,6101,3772,9873,319.546535,False,0.0,deepseek-ai/DeepSeek-V3.1,extract-elf,319.546535,False,0.6,False,319.546535 +53aff598-a8bc-4185-9886-e7358a8e4855,gpt-5-nano,openai,dna-assembly,11237,8759,19996,720.48179,False,0.0,gpt-5-nano,dna-assembly,720.48179,False,0.0,False,720.48179 +f6a957e6-f4fb-402c-b3eb-fd046460d669,gpt-5,openai,reshard-c4-data,2136,4968,7104,900.001721,True,1.0,gpt-5,reshard-c4-data,900.001721,True,0.3333333333333333,True,900.001721 +b19c5622-fbda-49e0-850b-83df83360911,gemini-2.5-flash,gemini,bn-fit-modify,25065,20145,45210,3608.480334,False,0.0,gemini-2.5-flash,bn-fit-modify,3608.480334,False,0.0,False,3608.480334 +cf5c2cd8-43c5-416b-a586-96427ffaa0d8,gpt-5-mini,openai,vulnerable-secret,5352,7583,12935,904.657216,False,0.0,gpt-5-mini,vulnerable-secret,904.657216,False,0.4,False,904.657216 +ca57e394-4100-407f-bb74-c786c14b52ed,claude-opus-4-1-20250805,anthropic,openssl-selfsigned-cert,3327,2689,6016,106.913432,True,1.0,claude-opus-4-1-20250805,openssl-selfsigned-cert,106.913432,True,1.0,True,106.913432 +bc06179e-f63f-4b42-8e3d-517056c0f246,claude-sonnet-4-20250514,anthropic,count-dataset-tokens,8038,1611,9649,903.145696,False,0.0,claude-sonnet-4-20250514,count-dataset-tokens,903.145696,False,0.0,False,903.145696 
+ab0f99bb-4d7f-4c79-b44d-07f86e76514a,claude-opus-4-1-20250805,anthropic,dna-insert,11558,6622,18180,219.451668,False,0.0,claude-opus-4-1-20250805,dna-insert,219.451668,False,0.0,False,219.451668 +daebf798-83c0-43d4-8c1c-991bd40fe682,grok-4-0709,xai,pypi-server,2680,2092,4772,364.268693,False,0.0,grok-4-0709,pypi-server,364.268693,False,0.4,False,364.268693 +7b5f3c52-ed5d-4e94-bd10-04944d2fafa3,OpenAI/gpt-oss-20B,together_ai,port-compressor,13294,46269,59563,3600.001354,False,0.0,OpenAI/gpt-oss-20B,port-compressor,3600.001354,False,0.0,False,3600.001354 +65c308bb-ba53-4cce-8a9d-400f723ecaf7,zai-org/GLM-4.5-Air-FP8,together_ai,gpt2-codegolf,14966,14528,29494,857.213558,False,0.0,zai-org/GLM-4.5-Air-FP8,gpt2-codegolf,857.213558,False,0.0,False,857.213558 +db6da5a7-058a-4629-8e7f-fc363c46ca1d,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,pytorch-model-cli,12552,4555,17107,902.028783,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,pytorch-model-cli,902.028783,False,0.0,False,902.028783 +e59958ca-45a7-49c9-aae9-400727717c94,grok-code-fast-1,xai,prove-plus-comm,1309,1402,2711,120.692465,False,0.0,grok-code-fast-1,prove-plus-comm,120.692465,False,0.4,False,120.692465 +d6f11601-42ba-4b67-9836-e28c3012b091,grok-4-0709,xai,cancel-async-tasks,1106,478,1584,151.319581,False,0.0,grok-4-0709,cancel-async-tasks,151.319581,False,0.0,False,151.319581 +741f502d-7463-49ee-a2dd-4010804303b5,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,form-filling,4581,3281,7862,781.053363,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,form-filling,781.053363,False,0.0,False,781.053363 +740ccc3f-2bab-4d1b-a3c5-08734da0daca,claude-opus-4-1-20250805,anthropic,git-leak-recovery,2459,1614,4073,85.344766,True,1.0,claude-opus-4-1-20250805,git-leak-recovery,85.344766,True,1.0,True,85.344766 
+8d6e1a2c-550d-4f42-9d43-32e0532a60da,claude-sonnet-4-20250514,anthropic,hf-model-inference,6383,3670,10053,509.279584,False,0.0,claude-sonnet-4-20250514,hf-model-inference,509.279584,False,0.2,False,509.279584 +22eb9328-282e-4bf9-84c1-a46f90d9299e,grok-4-0709,xai,form-filling,5435,4024,9459,502.933091,True,1.0,grok-4-0709,form-filling,502.933091,True,0.2,True,502.933091 +8ee45d2f-2056-4400-b3ac-af56b68be3ec,grok-4-0709,xai,fix-code-vulnerability,5934,4212,10146,900.848946,True,1.0,grok-4-0709,fix-code-vulnerability,900.848946,True,0.2,True,900.848946 +dcbf9b3d-13d8-485e-b37b-c163f959fa15,moonshotai/Kimi-K2-Instruct-0905,together_ai,install-windows-3.11,12630,8842,21472,530.472989,False,0.0,moonshotai/Kimi-K2-Instruct-0905,install-windows-3.11,530.472989,False,0.0,False,530.472989 +36f1367f-d655-41a7-b322-4ea5f1cffa6b,gpt-5-mini,openai,openssl-selfsigned-cert,2193,2683,4876,218.155395,True,1.0,gpt-5-mini,openssl-selfsigned-cert,218.155395,True,0.8,True,218.155395 +51221b1b-da66-43fe-972f-c28097569394,gemini-2.5-pro,gemini,wasm-pipeline,9778,2590,12368,404.091312,False,0.0,gemini-2.5-pro,wasm-pipeline,404.091312,False,0.0,False,404.091312 +200db22f-b194-4bd7-9485-a799febbf2db,claude-opus-4-1-20250805,anthropic,cobol-modernization,5342,2930,8272,919.19774,True,1.0,claude-opus-4-1-20250805,cobol-modernization,919.19774,True,0.875,True,919.19774 +8c31613f-334d-4ba5-8540-e574dfbd92d9,grok-4-0709,xai,fix-code-vulnerability,9803,4353,14156,994.054723,False,0.0,grok-4-0709,fix-code-vulnerability,994.054723,False,0.2,False,994.054723 +306a7098-d31a-4d50-ada2-8515ece2562f,OpenAI/gpt-oss-20B,together_ai,train-fasttext,1885,2489,4374,1764.887709,False,0.0,OpenAI/gpt-oss-20B,train-fasttext,1764.887709,False,0.0,False,1764.887709 +f59ad4df-ecb8-4e78-a851-ac3693341911,zai-org/GLM-4.5-Air-FP8,together_ai,build-cython-ext,20721,6148,26869,900.027686,False,0.0,zai-org/GLM-4.5-Air-FP8,build-cython-ext,900.027686,False,0.0,False,900.027686 
+e90c74f8-8785-42e4-97cf-b377cc708d7d,OpenAI/gpt-oss-20B,together_ai,gpt2-codegolf,956,294,1250,10.965606,False,0.0,OpenAI/gpt-oss-20B,gpt2-codegolf,10.965606,False,0.0,False,10.965606 +fa2f8c5e-cec5-45e3-9e45-890fb2452cbc,moonshotai/Kimi-K2-Instruct-0905,together_ai,wasm-pipeline,11155,2624,13779,946.478056,False,0.0,moonshotai/Kimi-K2-Instruct-0905,wasm-pipeline,946.478056,False,0.2,False,946.478056 +1cfce4b8-cfdf-408a-acf7-c3b9497cbb72,gpt-5-mini,openai,fix-git,4471,2384,6855,330.479175,True,1.0,gpt-5-mini,fix-git,330.479175,True,0.6,True,330.479175 +79d8264a-f5c3-443f-87e4-d7ecee3c561d,claude-sonnet-4-20250514,anthropic,pytorch-model-recovery,12888,4378,17266,443.183093,True,1.0,claude-sonnet-4-20250514,pytorch-model-recovery,443.183093,True,1.0,True,443.183093 +f46a9e2c-062e-410d-9d24-35c0e93b868f,moonshotai/Kimi-K2-Instruct-0905,together_ai,install-klee-minimal,10833,2489,13322,931.848327,False,0.0,moonshotai/Kimi-K2-Instruct-0905,install-klee-minimal,931.848327,False,0.0,False,931.848327 +cf09e239-52ba-4487-bd57-7bda44ceab33,grok-4-0709,xai,reshard-c4-data,4093,3261,7354,906.846254,False,0.0,grok-4-0709,reshard-c4-data,906.846254,False,0.0,False,906.846254 +6b61bf73-d2ea-416e-9a77-37fcac2543da,grok-4-0709,xai,sanitize-git-repo,8280,2047,10327,516.96535,False,0.0,grok-4-0709,sanitize-git-repo,516.96535,False,0.0,False,516.96535 +1a6b4329-8863-402a-b411-4774d0a93382,grok-4-0709,xai,build-pmars,8440,3410,11850,901.455583,False,0.0,grok-4-0709,build-pmars,901.455583,False,0.2,False,901.455583 +91aebae0-0889-4e7c-b509-59d9dd0a837d,gemini-2.5-flash,gemini,nginx-request-logging,3899,1680,5579,79.144991,False,0.0,gemini-2.5-flash,nginx-request-logging,79.144991,False,0.0,False,79.144991 +911b0fa0-b953-46ba-b240-c98cdb1e7c56,zai-org/GLM-4.5-Air-FP8,together_ai,regex-log,614,3092,3706,330.257806,False,0.0,zai-org/GLM-4.5-Air-FP8,regex-log,330.257806,False,0.2,False,330.257806 
+de70038d-df71-4088-88cf-dad0dab039bb,claude-opus-4-1-20250805,anthropic,install-windows-3.11,8953,3127,12080,267.745773,False,0.0,claude-opus-4-1-20250805,install-windows-3.11,267.745773,False,0.0,False,267.745773 +0946432d-d373-486b-816e-770ebdb4998b,gemini-2.5-pro,gemini,sqlite-db-truncate,3876,2475,6351,742.907514,False,0.0,gemini-2.5-pro,sqlite-db-truncate,742.907514,False,0.0,False,742.907514 +068b22e5-4ec3-4ff9-bd5b-fc2229c75dc6,grok-4-0709,xai,gpt2-codegolf,1097,571,1668,200.419406,False,0.0,grok-4-0709,gpt2-codegolf,200.419406,False,0.0,False,200.419406 +b0adb040-ac27-4b1c-bb74-26ab77a88328,gpt-5,openai,install-windows-3.11,4794,1910,6704,1094.848031,False,0.0,gpt-5,install-windows-3.11,1094.848031,False,0.0,False,1094.848031 +9a631723-ce2f-4fca-9639-65bcee16011a,grok-code-fast-1,xai,count-dataset-tokens,9289,2374,11663,340.246446,False,0.0,grok-code-fast-1,count-dataset-tokens,340.246446,False,0.0,False,340.246446 +b0a6ac8e-5c70-4a73-b11f-022db4f66eae,OpenAI/gpt-oss-20B,together_ai,constraints-scheduling,1512,1855,3367,192.806271,False,0.0,OpenAI/gpt-oss-20B,constraints-scheduling,192.806271,False,0.2,False,192.806271 +4d43befe-7cf9-406a-9aec-36fbdea7bc47,grok-4-0709,xai,large-scale-text-editing,1668,890,2558,384.673622,False,0.0,grok-4-0709,large-scale-text-editing,384.673622,False,0.4,False,384.673622 +6dd8dd37-af93-4da9-a56e-f981c0f6851e,grok-4-0709,xai,fix-ocaml-gc,29522,13652,43174,3602.41715,False,0.0,grok-4-0709,fix-ocaml-gc,3602.41715,False,0.0,False,3602.41715 +4eed7fe9-f3bc-415e-8e20-47e7d14fec5a,gpt-5-mini,openai,nginx-request-logging,3905,1957,5862,285.525567,True,1.0,gpt-5-mini,nginx-request-logging,285.525567,True,0.4,True,285.525567 +06915318-5cc7-450a-a044-5bb02368200d,gemini-2.5-flash,gemini,extract-elf,4118,2015,6133,164.870108,True,1.0,gemini-2.5-flash,extract-elf,164.870108,True,0.4,True,164.870108 
+a62b93c8-943a-4e5d-8172-6feea1c1b309,gpt-5-nano,openai,schemelike-metacircular-eval,13784,27969,41753,2407.831533,False,0.0,gpt-5-nano,schemelike-metacircular-eval,2407.831533,False,0.2,False,2407.831533 +9268506e-45bf-4157-8513-26dd0f6c57c1,OpenAI/gpt-oss-20B,together_ai,financial-document-processor,458,1336,1794,128.282891,False,0.0,OpenAI/gpt-oss-20B,financial-document-processor,128.282891,False,0.0,False,128.282891 +70cffa09-6399-42a2-9e3d-008fbd1235c2,OpenAI/gpt-oss-20B,together_ai,write-compressor,849,502,1351,1240.835153,False,0.0,OpenAI/gpt-oss-20B,write-compressor,1240.835153,False,0.0,False,1240.835153 +93f981af-778f-42d2-967e-db8f6bf96c44,grok-code-fast-1,xai,circuit-fibsqrt,5624,3664,9288,356.702902,False,0.0,grok-code-fast-1,circuit-fibsqrt,356.702902,False,0.0,False,356.702902 +1d01d2fa-42fd-4fc5-b808-38af1c5778c0,gpt-5,openai,git-leak-recovery,2351,1719,4070,280.969164,True,1.0,gpt-5,git-leak-recovery,280.969164,True,0.7142857142857143,True,280.969164 +f47bbcd0-0dc1-4b82-a0c9-f589ed8a8e5e,gpt-5-nano,openai,financial-document-processor,3590,4116,7706,1225.38529,False,0.0,gpt-5-nano,financial-document-processor,1225.38529,False,0.0,False,1225.38529 +3ceb6ac7-016e-4a9c-8d7e-f0fe68778ed2,gpt-5,openai,distribution-search,4316,3297,7613,148.571519,True,1.0,gpt-5,distribution-search,148.571519,True,1.0,True,148.571519 +4c465ca1-4bcf-417b-b1ba-fd2a19241a3c,openai/gpt-oss-120b,together_ai,bn-fit-modify,7239,5954,13193,388.341266,True,1.0,openai/gpt-oss-120b,bn-fit-modify,388.341266,True,0.2,True,388.341266 +9b9f8148-5bb0-4f82-be14-16099f5bf93e,deepseek-ai/DeepSeek-V3.1,together_ai,install-windows-3.11,7344,2703,10047,183.731293,False,0.0,deepseek-ai/DeepSeek-V3.1,install-windows-3.11,183.731293,False,0.0,False,183.731293 +30ca15c5-20ba-4359-82b9-bc846cbb8d77,claude-sonnet-4-20250514,anthropic,fix-git,3538,2405,5943,275.255393,True,1.0,claude-sonnet-4-20250514,fix-git,275.255393,True,1.0,True,275.255393 
+0e5549d3-3346-4946-9b1c-b82839b84a22,gemini-2.5-flash,gemini,fix-code-vulnerability,28566,13870,42436,900.057884,False,0.0,gemini-2.5-flash,fix-code-vulnerability,900.057884,False,0.0,False,900.057884 +f4e0a6c6-7226-4bfd-87e9-0ea53c38e392,moonshotai/Kimi-K2-Instruct-0905,together_ai,video-processing,8538,9279,17817,499.243593,False,0.0,moonshotai/Kimi-K2-Instruct-0905,video-processing,499.243593,False,0.0,False,499.243593 +15a973d3-6470-4dcd-ac6a-5a624c94980d,gpt-5-nano,openai,build-initramfs-qemu,9487,6676,16163,902.49105,False,0.0,gpt-5-nano,build-initramfs-qemu,902.49105,False,0.0,False,902.49105 +3df36c48-c757-47f8-a4fa-ec2c58162411,deepseek-ai/DeepSeek-V3.1,together_ai,path-tracing,10640,9658,20298,573.872056,False,0.0,deepseek-ai/DeepSeek-V3.1,path-tracing,573.872056,False,0.0,False,573.872056 +8863cd87-0e4c-464e-b33e-c2fe56704274,gpt-5,openai,log-summary-date-ranges,5588,1715,7303,109.220249,False,0.0,gpt-5,log-summary-date-ranges,109.220249,False,0.0,False,109.220249 +96664f21-195e-4a7f-903d-46ec1162f93a,zai-org/GLM-4.5-Air-FP8,together_ai,dna-assembly,20214,6585,26799,722.096251,False,0.0,zai-org/GLM-4.5-Air-FP8,dna-assembly,722.096251,False,0.0,False,722.096251 +a6afc17a-ec75-4d7d-a800-1ae095eeede6,gemini-2.5-pro,gemini,openssl-selfsigned-cert,3320,2366,5686,204.034046,False,0.0,gemini-2.5-pro,openssl-selfsigned-cert,204.034046,False,0.6,False,204.034046 +99e8d69c-0ab0-4634-80d7-8b00781584ad,claude-opus-4-1-20250805,anthropic,mteb-retrieve,2591,1437,4028,226.049896,False,0.0,claude-opus-4-1-20250805,mteb-retrieve,226.049896,False,0.0,False,226.049896 +21116792-02f2-448d-a096-6c493e3dae40,gpt-5-mini,openai,feal-differential-cryptanalysis,2274,1342,3616,246.990724,False,0.0,gpt-5-mini,feal-differential-cryptanalysis,246.990724,False,0.0,False,246.990724 +7df3ba0c-109b-4dab-8d0b-ea0bb74ee875,deepseek-ai/DeepSeek-V3.1,together_ai,run-pdp11-code,5504,2166,7670,1002.31305,False,0.0,deepseek-ai/DeepSeek-V3.1,run-pdp11-code,1002.31305,False,0.0,False,1002.31305 
+cebc15ff-5382-4b44-a166-ca69347a3ba4,gemini-2.5-flash,gemini,adaptive-rejection-sampler,13101,34520,47621,917.145767,False,0.0,gemini-2.5-flash,adaptive-rejection-sampler,917.145767,False,0.0,False,917.145767 +bbee7837-49da-4fba-be76-0fcd667ea4b9,gpt-5-nano,openai,adaptive-rejection-sampler,5834,6438,12272,900.491184,False,0.0,gpt-5-nano,adaptive-rejection-sampler,900.491184,False,0.2,False,900.491184 +c46ca70b-7d11-484c-b1f4-880a6ae0029b,grok-4-0709,xai,make-doom-for-mips,19346,3489,22835,762.002849,False,0.0,grok-4-0709,make-doom-for-mips,762.002849,False,0.0,False,762.002849 +30145c9c-5e21-4eca-93ff-7e627799214b,grok-4-0709,xai,write-compressor,1468,694,2162,900.477512,False,0.0,grok-4-0709,write-compressor,900.477512,False,0.0,False,900.477512 +3f4892b4-06c7-4cef-8173-5e86a83870ca,claude-sonnet-4-20250514,anthropic,make-doom-for-mips,8884,1505,10389,1139.812455,False,0.0,claude-sonnet-4-20250514,make-doom-for-mips,1139.812455,False,0.0,False,1139.812455 +7d3aaf4d-cfd0-4ddd-96a1-3051d7006ac7,deepseek-ai/DeepSeek-V3.1,together_ai,gpt2-codegolf,5656,5838,11494,906.423934,False,0.0,deepseek-ai/DeepSeek-V3.1,gpt2-codegolf,906.423934,False,0.0,False,906.423934 +5c7984d6-e2ef-41b4-910a-1e26c15e161a,zai-org/GLM-4.5-Air-FP8,together_ai,hf-model-inference,4919,4153,9072,214.834857,True,1.0,zai-org/GLM-4.5-Air-FP8,hf-model-inference,214.834857,True,0.8,True,214.834857 +f7ce9acf-1cf6-4572-8703-d60472b19b0e,gemini-2.5-flash,gemini,fix-ocaml-gc,44712,40895,85607,3600.024888,False,0.0,gemini-2.5-flash,fix-ocaml-gc,3600.024888,False,0.0,False,3600.024888 +944582c8-707e-4b74-891b-c763a689827c,grok-4-0709,xai,write-compressor,796,396,1192,908.163267,False,0.0,grok-4-0709,write-compressor,908.163267,False,0.0,False,908.163267 +aae8953f-6f75-4525-81d3-57317d7c935d,claude-sonnet-4-20250514,anthropic,build-pmars,13016,4176,17192,903.979358,False,0.0,claude-sonnet-4-20250514,build-pmars,903.979358,False,0.6,False,903.979358 
+14513e5c-1d1b-490c-95f8-6629a680a73d,zai-org/GLM-4.5-Air-FP8,together_ai,pytorch-model-recovery,18181,16373,34554,912.530928,False,0.0,zai-org/GLM-4.5-Air-FP8,pytorch-model-recovery,912.530928,False,0.4,False,912.530928 +c21fcb54-3feb-4fc9-8a2e-f7124ea72623,gpt-5,openai,prove-plus-comm,3271,3532,6803,370.875792,True,1.0,gpt-5,prove-plus-comm,370.875792,True,0.8571428571428571,True,370.875792 +f5e368ff-0c49-4219-8bce-bf96656ec774,gpt-5-nano,openai,extract-elf,5426,914,6340,144.633765,False,0.0,gpt-5-nano,extract-elf,144.633765,False,0.2,False,144.633765 +89055f67-1b67-40b3-bdf9-97efb99e91bf,moonshotai/Kimi-K2-Instruct-0905,together_ai,count-dataset-tokens,9147,4560,13707,729.314036,False,0.0,moonshotai/Kimi-K2-Instruct-0905,count-dataset-tokens,729.314036,False,0.2,False,729.314036 +dad2e1e9-306e-4c4f-b05c-93f924c4992b,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,openssl-selfsigned-cert,4237,3308,7545,715.499315,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,openssl-selfsigned-cert,715.499315,False,0.4,False,715.499315 +15a16daa-0e26-4476-a624-60b230504850,gemini-2.5-flash,gemini,openssl-selfsigned-cert,2893,1909,4802,189.281763,False,0.0,gemini-2.5-flash,openssl-selfsigned-cert,189.281763,False,0.0,False,189.281763 +68b616a2-5897-4f6a-8e3e-779f95e1bcc8,gpt-5,openai,path-tracing,26641,27059,53700,1800.009502,False,0.0,gpt-5,path-tracing,1800.009502,False,0.0,False,1800.009502 +c1074f82-7eed-4300-91dc-6076e76b1e38,zai-org/GLM-4.5-Air-FP8,together_ai,pytorch-model-cli,7253,8283,15536,732.154506,False,0.0,zai-org/GLM-4.5-Air-FP8,pytorch-model-cli,732.154506,False,0.0,False,732.154506 +b8db87c7-883d-407f-8e47-442a9d4d9ab3,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,count-dataset-tokens,13174,3223,16397,920.348228,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,count-dataset-tokens,920.348228,False,0.0,False,920.348228 
+f1ab02d9-2e8f-4016-9adb-a0aa62fe91f5,grok-code-fast-1,xai,prove-plus-comm,3084,6377,9461,871.183531,False,0.0,grok-code-fast-1,prove-plus-comm,871.183531,False,0.4,False,871.183531 +406de4ef-6bb1-4608-97d9-10fc1834b3e0,gpt-5-mini,openai,db-wal-recovery,4993,4100,9093,343.972251,False,0.0,gpt-5-mini,db-wal-recovery,343.972251,False,0.0,False,343.972251 +a642e599-09ef-478e-8be8-31183a6cd191,deepseek-ai/DeepSeek-V3.1,together_ai,mteb-leaderboard,2374,1901,4275,190.981321,False,0.0,deepseek-ai/DeepSeek-V3.1,mteb-leaderboard,190.981321,False,0.0,False,190.981321 +d0598434-de08-40ad-b769-c5f1234561a9,zai-org/GLM-4.5-Air-FP8,together_ai,adaptive-rejection-sampler,11034,12516,23550,903.992176,False,0.0,zai-org/GLM-4.5-Air-FP8,adaptive-rejection-sampler,903.992176,False,0.0,False,903.992176 +7fe73d27-fcbe-4ea0-8a3b-14b5e50aa7ae,zai-org/GLM-4.5-Air-FP8,together_ai,build-pmars,16417,7169,23586,792.382754,True,1.0,zai-org/GLM-4.5-Air-FP8,build-pmars,792.382754,True,0.6,True,792.382754 +f4ab7d8d-4c1f-439c-95bb-fb3bdfea7197,gemini-2.5-pro,gemini,form-filling,6298,4420,10718,215.428702,False,0.0,gemini-2.5-pro,form-filling,215.428702,False,0.2,False,215.428702 +3047ae54-efed-4b96-8549-4751dffdb665,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,train-fasttext,26921,8846,35767,3600.005859,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,train-fasttext,3600.005859,False,0.0,False,3600.005859 +5130b763-6a79-4f2f-9081-7479fdcc89eb,claude-opus-4-1-20250805,anthropic,filter-js-from-html,10932,10833,21765,497.97139,False,0.0,claude-opus-4-1-20250805,filter-js-from-html,497.97139,False,0.0,False,497.97139 +af94516c-8e30-433b-9281-2445048c3173,grok-code-fast-1,xai,install-klee-minimal,8304,2631,10935,900.001959,False,0.0,grok-code-fast-1,install-klee-minimal,900.001959,False,0.0,False,900.001959 
+14febac8-9296-4e61-9de1-0191f1e780bd,zai-org/GLM-4.5-Air-FP8,together_ai,write-compressor,19179,18679,37858,909.351836,False,0.0,zai-org/GLM-4.5-Air-FP8,write-compressor,909.351836,False,0.0,False,909.351836 +b95dc6a4-4397-45b5-88b3-6f7579459425,claude-opus-4-1-20250805,anthropic,pytorch-model-cli,5045,4010,9055,496.116245,True,1.0,claude-opus-4-1-20250805,pytorch-model-cli,496.116245,True,0.4285714285714285,True,496.116245 +04968b24-13d5-41f7-8863-8a20b73666bc,grok-code-fast-1,xai,build-initramfs-qemu,2192,1477,3669,148.588737,False,0.0,grok-code-fast-1,build-initramfs-qemu,148.588737,False,0.0,False,148.588737 +fb88a68e-8936-4759-8ad6-58b5cd07cd59,gemini-2.5-flash,gemini,build-pmars,19169,7817,26986,526.52064,True,1.0,gemini-2.5-flash,build-pmars,526.52064,True,0.8,True,526.52064 +72441315-2887-46c0-9164-780e68361e70,claude-sonnet-4-20250514,anthropic,video-processing,5354,4328,9682,238.995213,False,0.0,claude-sonnet-4-20250514,video-processing,238.995213,False,0.0,False,238.995213 +9679a48a-c639-4284-b212-2b0f33001376,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,regex-log,5042,4332,9374,837.614507,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,regex-log,837.614507,True,0.2,True,837.614507 +e44cf683-bc75-4d8b-8af8-878d6cdf9e1a,gemini-2.5-flash,gemini,dna-insert,5421,2096,7517,384.723377,False,0.0,gemini-2.5-flash,dna-insert,384.723377,False,0.0,False,384.723377 +7b75891e-17bb-4be9-aaad-b7e6cf32fddb,deepseek-ai/DeepSeek-V3.1,together_ai,sparql-university,8498,3397,11895,770.924272,False,0.0,deepseek-ai/DeepSeek-V3.1,sparql-university,770.924272,False,0.0,False,770.924272 +8b012a4f-39f6-4bf0-af46-fda21c0af6cb,grok-4-0709,xai,sparql-university,9887,3666,13553,900.042243,False,0.0,grok-4-0709,sparql-university,900.042243,False,0.4,False,900.042243 +28107a4a-8f31-47f0-a3fc-3bcc76503248,grok-code-fast-1,xai,dna-assembly,1807,1180,2987,59.790115,False,0.0,grok-code-fast-1,dna-assembly,59.790115,False,0.0,False,59.790115 
+d5b34d69-68b6-4144-93c4-d20890f88e84,gemini-2.5-flash,gemini,large-scale-text-editing,3604,2492,6096,203.000537,False,0.0,gemini-2.5-flash,large-scale-text-editing,203.000537,False,0.0,False,203.000537 +9dbbaf1b-8b17-4c1c-9011-833f4e8a6193,openai/gpt-oss-120b,together_ai,polyglot-rust-c,2798,5813,8611,900.017479,False,0.0,openai/gpt-oss-120b,polyglot-rust-c,900.017479,False,0.0,False,900.017479 +623a966d-53ac-450c-96d8-8d84204ff3aa,grok-code-fast-1,xai,fix-git,2135,1599,3734,82.770473,False,0.0,grok-code-fast-1,fix-git,82.770473,False,0.2,False,82.770473 +4c25ebc8-f90f-461c-822e-c2bc870ee96b,moonshotai/Kimi-K2-Instruct-0905,together_ai,cobol-modernization,14048,11829,25877,915.755655,False,0.0,moonshotai/Kimi-K2-Instruct-0905,cobol-modernization,915.755655,False,0.6,False,915.755655 +6634cdb8-cbb3-4206-aa65-6b897fdb6bb2,grok-code-fast-1,xai,large-scale-text-editing,2523,1083,3606,106.596472,False,0.0,grok-code-fast-1,large-scale-text-editing,106.596472,False,0.0,False,106.596472 +5ca54a18-7919-4eb2-b504-3aa291b3a3f4,gpt-5-mini,openai,dna-insert,4874,4862,9736,369.690304,False,0.0,gpt-5-mini,dna-insert,369.690304,False,0.0,False,369.690304 +27d7f820-23b9-4ef4-b0af-26f76c5a9ef0,zai-org/GLM-4.5-Air-FP8,together_ai,qemu-alpine-ssh,1927,2145,4072,234.124801,False,0.0,zai-org/GLM-4.5-Air-FP8,qemu-alpine-ssh,234.124801,False,0.0,False,234.124801 +4244576d-586c-4f42-ac93-0c4ded3eead1,gemini-2.5-flash,gemini,reshard-c4-data,13753,11188,24941,687.971142,False,0.0,gemini-2.5-flash,reshard-c4-data,687.971142,False,0.0,False,687.971142 +802a0ccf-7dc4-47cf-91c2-5ccd9713cfc3,gpt-5,openai,count-dataset-tokens,2825,4779,7604,900.418506,False,0.0,gpt-5,count-dataset-tokens,900.418506,False,0.1666666666666666,False,900.418506 +03676562-8dfd-41c2-813c-068d914ec293,gemini-2.5-pro,gemini,chess-best-move,11141,8090,19231,901.276443,False,0.0,gemini-2.5-pro,chess-best-move,901.276443,False,0.0,False,901.276443 
+06150deb-40ab-4945-a75a-8868751e998b,gemini-2.5-flash,gemini,build-pmars,12507,3986,16493,297.764865,True,1.0,gemini-2.5-flash,build-pmars,297.764865,True,0.8,True,297.764865 +507be476-27a6-4de9-822b-72a86043bdcd,gpt-5,openai,fix-ocaml-gc,23883,24477,48360,3607.458276,False,0.0,gpt-5,fix-ocaml-gc,3607.458276,False,0.0,False,3607.458276 +caa90f1a-6279-4eae-bb47-a68dfac3e0ac,gemini-2.5-flash,gemini,write-compressor,11646,42135,53781,917.835988,False,0.0,gemini-2.5-flash,write-compressor,917.835988,False,0.0,False,917.835988 +1c09673c-966a-4744-9bfd-040cf0badc26,gpt-5-mini,openai,large-scale-text-editing,23907,7411,31318,1211.098618,False,0.0,gpt-5-mini,large-scale-text-editing,1211.098618,False,0.2,False,1211.098618 +30ccdbd1-60e5-449c-94ac-84642f8b8131,gemini-2.5-pro,gemini,install-windows-3.11,6872,2321,9193,1216.939536,False,0.0,gemini-2.5-pro,install-windows-3.11,1216.939536,False,0.0,False,1216.939536 +c40c8646-7196-4bc4-a2fc-e6f1f067b0f6,grok-code-fast-1,xai,merge-diff-arc-agi-task,8254,2288,10542,282.980675,True,1.0,grok-code-fast-1,merge-diff-arc-agi-task,282.980675,True,0.8,True,282.980675 +15165a39-69c1-4c0f-bf4c-71bf15f19fea,claude-opus-4-1-20250805,anthropic,hf-model-inference,6660,4120,10780,955.236685,False,0.0,claude-opus-4-1-20250805,hf-model-inference,955.236685,False,0.25,False,955.236685 +4ccaa0b7-63a0-4c03-84c2-ab8046d5f886,deepseek-ai/DeepSeek-V3.1,together_ai,train-fasttext,19616,6631,26247,1980.26789,False,0.0,deepseek-ai/DeepSeek-V3.1,train-fasttext,1980.26789,False,0.0,False,1980.26789 +e7c1926a-9ebd-4f80-afe1-ac4f395b4824,moonshotai/Kimi-K2-Instruct-0905,together_ai,bn-fit-modify,18382,7954,26336,1182.862434,False,0.0,moonshotai/Kimi-K2-Instruct-0905,bn-fit-modify,1182.862434,False,0.0,False,1182.862434 +d5df5d43-7d4d-436b-9bcd-4929ce745323,claude-sonnet-4-20250514,anthropic,mteb-retrieve,2704,2043,4747,468.498031,False,0.0,claude-sonnet-4-20250514,mteb-retrieve,468.498031,False,0.0,False,468.498031 
+ec738d5b-eda5-4824-94eb-4c266247d441,gpt-5-mini,openai,prove-plus-comm,1737,865,2602,170.22793,True,1.0,gpt-5-mini,prove-plus-comm,170.22793,True,0.6,True,170.22793 +adb67505-f120-4d11-a68f-68a9689ee93f,claude-opus-4-1-20250805,anthropic,fix-code-vulnerability,15142,9083,24225,900.460466,False,0.0,claude-opus-4-1-20250805,fix-code-vulnerability,900.460466,False,0.125,False,900.460466 +e69573f8-1005-43c1-97a6-de53ad690f46,gemini-2.5-pro,gemini,adaptive-rejection-sampler,9822,4783,14605,526.494362,False,0.0,gemini-2.5-pro,adaptive-rejection-sampler,526.494362,False,0.4,False,526.494362 +89a1c6ab-7123-4a5c-9532-a75973c98d28,gemini-2.5-flash,gemini,mteb-leaderboard,936,365,1301,100.554383,False,0.0,gemini-2.5-flash,mteb-leaderboard,100.554383,False,0.0,False,100.554383 +686fb927-8a47-4d41-aa5a-30b8e72e08a8,grok-code-fast-1,xai,code-from-image,4943,807,5750,130.496806,False,0.0,grok-code-fast-1,code-from-image,130.496806,False,0.0,False,130.496806 +0e79fa68-6f33-46be-92fa-282233ca20e8,moonshotai/Kimi-K2-Instruct-0905,together_ai,git-leak-recovery,3158,2546,5704,266.738993,True,1.0,moonshotai/Kimi-K2-Instruct-0905,git-leak-recovery,266.738993,True,1.0,True,266.738993 +35c29313-afc7-4511-abe8-13b9c9177d42,grok-code-fast-1,xai,openssl-selfsigned-cert,1653,1022,2675,71.394297,False,0.0,grok-code-fast-1,openssl-selfsigned-cert,71.394297,False,0.2,False,71.394297 +53551a68-9fd5-4e9c-baf4-c65cc45331a1,gpt-5-nano,openai,constraints-scheduling,3138,2922,6060,184.273481,False,0.0,gpt-5-nano,constraints-scheduling,184.273481,False,0.4,False,184.273481 +61c6b66d-acfa-447f-9815-abb99f588e43,zai-org/GLM-4.5-Air-FP8,together_ai,cancel-async-tasks,831,2244,3075,170.509257,False,0.0,zai-org/GLM-4.5-Air-FP8,cancel-async-tasks,170.509257,False,0.2,False,170.509257 +2e826f40-86e4-4c76-a38a-72e7b3d3155a,claude-opus-4-1-20250805,anthropic,fix-code-vulnerability,15436,5755,21191,273.411887,True,1.0,claude-opus-4-1-20250805,fix-code-vulnerability,273.411887,True,0.125,True,273.411887 
+f913d927-aada-47cc-b8b5-1a3bf9f0749b,gpt-5,openai,count-dataset-tokens,8789,3965,12754,668.834334,False,0.0,gpt-5,count-dataset-tokens,668.834334,False,0.1666666666666666,False,668.834334 +f09e523d-0fd0-45c2-b101-c1a8ef503cf2,gpt-5-nano,openai,sanitize-git-repo,8259,5812,14071,924.750022,False,0.0,gpt-5-nano,sanitize-git-repo,924.750022,False,0.0,False,924.750022 +3809efb8-5704-4b2c-88b2-d3a3ac7e6577,deepseek-ai/DeepSeek-V3.1,together_ai,circuit-fibsqrt,12474,9952,22426,2121.039872,False,0.0,deepseek-ai/DeepSeek-V3.1,circuit-fibsqrt,2121.039872,False,0.0,False,2121.039872 +cb9c8422-c024-410c-ac0b-2be8a204cd66,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,git-leak-recovery,2251,1612,3863,93.864496,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,git-leak-recovery,93.864496,True,1.0,True,93.864496 +42d71610-09fb-4716-ad4b-d376e95eca25,claude-opus-4-1-20250805,anthropic,fix-ocaml-gc,27458,16957,44415,3605.734469,False,0.0,claude-opus-4-1-20250805,fix-ocaml-gc,3605.734469,False,0.5,False,3605.734469 +01badb25-d302-4572-8890-cbcc60e20851,claude-opus-4-1-20250805,anthropic,schemelike-metacircular-eval,19172,14718,33890,896.959935,False,0.0,claude-opus-4-1-20250805,schemelike-metacircular-eval,896.959935,False,0.0,False,896.959935 +efb8c4b4-7411-4c5d-a449-d5d4f6cf1f20,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,large-scale-text-editing,3542,1208,4750,73.994836,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,large-scale-text-editing,73.994836,False,0.0,False,73.994836 +a7f11ae4-baec-4d2d-a80d-0d88afbac197,gemini-2.5-flash,gemini,dna-assembly,1483,21040,22523,738.785815,False,0.0,gemini-2.5-flash,dna-assembly,738.785815,False,0.0,False,738.785815 +230a3ee5-9a5d-4e90-aa54-3677f3dd4904,gemini-2.5-flash,gemini,password-recovery,2804,6441,9245,900.081882,False,0.0,gemini-2.5-flash,password-recovery,900.081882,False,0.0,False,900.081882 
+ec7e1452-1173-4307-9cc5-a079226c594b,gpt-5-mini,openai,write-compressor,3929,2069,5998,200.739629,False,0.0,gpt-5-mini,write-compressor,200.739629,False,0.0,False,200.739629 +680286e7-125b-4569-b57c-1b81ffa58f22,zai-org/GLM-4.5-Air-FP8,together_ai,fix-git,5504,3095,8599,56.829034,True,1.0,zai-org/GLM-4.5-Air-FP8,fix-git,56.829034,True,0.6,True,56.829034 +ff190d1a-d2a0-4418-bb98-59957e4a1c69,grok-4-0709,xai,schemelike-metacircular-eval,8735,4593,13328,2409.700032,False,0.0,grok-4-0709,schemelike-metacircular-eval,2409.700032,False,0.0,False,2409.700032 +8b737da3-a70e-49e7-a047-d8094973eec4,gemini-2.5-pro,gemini,build-initramfs-qemu,6654,2682,9336,615.238579,False,0.0,gemini-2.5-pro,build-initramfs-qemu,615.238579,False,0.0,False,615.238579 +d4049088-08a1-4225-b023-2d1de1163a3c,grok-4-0709,xai,sqlite-db-truncate,3109,2226,5335,910.658276,False,0.0,grok-4-0709,sqlite-db-truncate,910.658276,False,0.0,False,910.658276 +1b0a2cc5-d2e5-46c6-bfa2-c4f63d43072d,gemini-2.5-flash,gemini,financial-document-processor,10759,16826,27585,1203.330971,False,0.0,gemini-2.5-flash,financial-document-processor,1203.330971,False,0.0,False,1203.330971 +e3a55e78-036b-42c2-b8e3-8f7d6756eeea,grok-code-fast-1,xai,dna-insert,6346,2058,8404,146.885531,False,0.0,grok-code-fast-1,dna-insert,146.885531,False,0.0,False,146.885531 +680d091d-b56f-4390-ae80-3093fd2f9848,gpt-5-nano,openai,nginx-request-logging,3778,1996,5774,364.983412,False,0.0,gpt-5-nano,nginx-request-logging,364.983412,False,0.0,False,364.983412 +b9e62e60-c9f5-4fbd-9126-92ba8a0de0c6,gpt-5-mini,openai,large-scale-text-editing,6505,6116,12621,1208.139785,False,0.0,gpt-5-mini,large-scale-text-editing,1208.139785,False,0.2,False,1208.139785 +b2c4efb1-f942-4c47-92ab-c68ee78a2121,gemini-2.5-pro,gemini,path-tracing,2403,2552,4955,347.161579,False,0.0,gemini-2.5-pro,path-tracing,347.161579,False,0.0,False,347.161579 
+90c3c2ca-b2f1-4700-b045-a8c89364cddd,gemini-2.5-pro,gemini,feal-linear-cryptanalysis,7406,9833,17239,1801.078126,False,0.0,gemini-2.5-pro,feal-linear-cryptanalysis,1801.078126,False,0.0,False,1801.078126 +64b0f6c2-ddff-40b2-b7f8-f13f58175153,zai-org/GLM-4.5-Air-FP8,together_ai,build-pov-ray,34987,15890,50877,2846.885745,False,0.0,zai-org/GLM-4.5-Air-FP8,build-pov-ray,2846.885745,False,0.0,False,2846.885745 +86bdef5a-7f00-46fe-a1da-e049def48660,gpt-5-mini,openai,dna-assembly,5233,6122,11355,230.196528,False,0.0,gpt-5-mini,dna-assembly,230.196528,False,0.0,False,230.196528 +568e0102-19d3-4ef4-8bb9-cfaee50d42b1,grok-4-0709,xai,extract-elf,1522,2157,3679,904.723108,False,0.0,grok-4-0709,extract-elf,904.723108,False,0.2,False,904.723108 +8577cfaa-3a2a-46cd-a6de-54c6eae6dfc7,grok-4-0709,xai,reshard-c4-data,3283,2824,6107,901.523752,False,0.0,grok-4-0709,reshard-c4-data,901.523752,False,0.0,False,901.523752 +3a93cf5c-a5ea-49e4-8b6d-5faaa625fb56,grok-4-0709,xai,video-processing,1770,1090,2860,252.691189,False,0.0,grok-4-0709,video-processing,252.691189,False,0.0,False,252.691189 +b06b8e32-eec1-4113-961f-72a24749878b,deepseek-ai/DeepSeek-V3.1,together_ai,path-tracing-reverse,25688,17839,43527,1808.218798,False,0.0,deepseek-ai/DeepSeek-V3.1,path-tracing-reverse,1808.218798,False,0.2,False,1808.218798 +a4c88d8d-cd05-4789-b7c9-bbb8c134b2a8,gpt-5,openai,extract-elf,5124,4338,9462,558.509989,False,0.0,gpt-5,extract-elf,558.509989,False,0.2857142857142857,False,558.509989 +a6d26931-9a2b-4a2c-ae40-d0c8af583cb9,grok-4-0709,xai,reverse-engineering,10655,3560,14215,1800.064454,False,0.0,grok-4-0709,reverse-engineering,1800.064454,False,0.2,False,1800.064454 +03e297f7-5713-4f58-a832-08c5bde03d26,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,tune-mjcf,5490,3782,9272,476.42247,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,tune-mjcf,476.42247,False,0.0,False,476.42247 
+ff2984fe-8406-4aa9-9988-26b6919961fd,gpt-5-mini,openai,sparql-university,8825,5404,14229,305.642809,False,0.0,gpt-5-mini,sparql-university,305.642809,False,0.0,False,305.642809 +cff297dc-7d6b-4018-b305-fc0f39d79384,claude-opus-4-1-20250805,anthropic,polyglot-c-py,10263,5904,16167,181.783692,False,0.0,claude-opus-4-1-20250805,polyglot-c-py,181.783692,False,0.0,False,181.783692 +fbed5025-a81d-4502-9017-527a16222baa,claude-sonnet-4-20250514,anthropic,extract-elf,6098,3867,9965,262.716691,False,0.0,claude-sonnet-4-20250514,extract-elf,262.716691,False,0.2,False,262.716691 +cd91bf5f-b311-4160-a9ae-63982c217631,gemini-2.5-flash,gemini,mteb-leaderboard,982,439,1421,327.728106,False,0.0,gemini-2.5-flash,mteb-leaderboard,327.728106,False,0.0,False,327.728106 +588ead5f-6057-4782-9ef9-75c05f1c98bf,gemini-2.5-pro,gemini,install-windows-3.11,16597,6901,23498,902.519851,False,0.0,gemini-2.5-pro,install-windows-3.11,902.519851,False,0.0,False,902.519851 +7d5be542-d466-448e-a3ff-90dcf5b16d34,gemini-2.5-pro,gemini,install-klee-minimal,9156,1424,10580,900.284624,False,0.0,gemini-2.5-pro,install-klee-minimal,900.284624,False,0.0,False,900.284624 +e3db734e-eeb3-40e9-a923-66b4270fa87b,openai/gpt-oss-120b,together_ai,distribution-search,1728,1974,3702,94.120256,False,0.0,openai/gpt-oss-120b,distribution-search,94.120256,False,0.0,False,94.120256 +c0862183-8e5b-4ce4-a85d-61b58affe465,OpenAI/gpt-oss-20B,together_ai,count-dataset-tokens,3223,9956,13179,731.413682,False,0.0,OpenAI/gpt-oss-20B,count-dataset-tokens,731.413682,False,0.0,False,731.413682 +030828da-6675-4d8d-8d91-cef45fcda67e,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-pmars,9941,4334,14275,489.769214,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-pmars,489.769214,False,0.2,False,489.769214 +a71688f3-d6ed-45dd-a6ac-e7d58162c60b,grok-code-fast-1,xai,pytorch-model-cli,2749,1376,4125,255.958622,False,0.0,grok-code-fast-1,pytorch-model-cli,255.958622,False,0.0,False,255.958622 
+835e01a1-3a0c-4cd9-9ae1-62774e9554f8,OpenAI/gpt-oss-20B,together_ai,feal-linear-cryptanalysis,4191,15903,20094,1819.826953,False,0.0,OpenAI/gpt-oss-20B,feal-linear-cryptanalysis,1819.826953,False,0.0,False,1819.826953 +0daff0df-347c-43d7-aec9-94141316e1cf,claude-opus-4-1-20250805,anthropic,git-leak-recovery,3242,1945,5187,245.159802,True,1.0,claude-opus-4-1-20250805,git-leak-recovery,245.159802,True,1.0,True,245.159802 +f2faf36e-b0f2-43cd-a284-924ff7d50adb,deepseek-ai/DeepSeek-V3.1,together_ai,run-pdp11-code,20588,12625,33213,1012.509882,False,0.0,deepseek-ai/DeepSeek-V3.1,run-pdp11-code,1012.509882,False,0.0,False,1012.509882 +8f39ec56-51af-497a-bd4f-235c50aa2fe0,moonshotai/Kimi-K2-Instruct-0905,together_ai,configure-git-webserver,4271,3098,7369,604.730001,True,1.0,moonshotai/Kimi-K2-Instruct-0905,configure-git-webserver,604.730001,True,0.6,True,604.730001 +40276b94-d5bc-484e-9b87-78c8e2981b25,claude-sonnet-4-20250514,anthropic,log-summary-date-ranges,9073,2925,11998,281.754222,True,1.0,claude-sonnet-4-20250514,log-summary-date-ranges,281.754222,True,1.0,True,281.754222 +0acbeb7c-6c3a-404b-8dfe-a0d9aacc7d93,OpenAI/gpt-oss-20B,together_ai,configure-git-webserver,1363,1056,2419,104.181251,False,0.0,OpenAI/gpt-oss-20B,configure-git-webserver,104.181251,False,0.2,False,104.181251 +6cd1a883-1863-4e38-a56b-4ea43bd653cb,gpt-5-nano,openai,db-wal-recovery,5355,8923,14278,906.782637,False,0.0,gpt-5-nano,db-wal-recovery,906.782637,False,0.0,False,906.782637 +4e9690a0-647b-4a23-8f7a-5af107c2da6e,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,install-windows-3.11,8343,2729,11072,199.669191,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,install-windows-3.11,199.669191,False,0.0,False,199.669191 +baa7b454-08dc-40a5-a261-6046202442db,gpt-5,openai,code-from-image,13475,16543,30018,1220.118122,False,0.0,gpt-5,code-from-image,1220.118122,False,0.4,False,1220.118122 
+6184b94b-1597-419a-9424-f1278aaffd17,claude-opus-4-1-20250805,anthropic,sqlite-with-gcov,9496,1395,10891,162.582046,True,1.0,claude-opus-4-1-20250805,sqlite-with-gcov,162.582046,True,0.5714285714285714,True,162.582046 +81d164d0-a2d4-4114-92d9-c46365ba523c,claude-opus-4-1-20250805,anthropic,form-filling,6368,4704,11072,152.590298,True,1.0,claude-opus-4-1-20250805,form-filling,152.590298,True,1.0,True,152.590298 +0443b97d-fb79-40d8-8221-e8fb98f8b037,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sparql-university,8004,2078,10082,197.593441,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sparql-university,197.593441,False,0.0,False,197.593441 +376f51b0-482f-4d72-a54a-489420db51cd,gpt-5-nano,openai,reshard-c4-data,9928,15415,25343,1684.60652,False,0.0,gpt-5-nano,reshard-c4-data,1684.60652,False,0.0,False,1684.60652 +7544d79b-faf8-4792-b142-3881601ce82f,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,nginx-request-logging,7763,5454,13217,900.532029,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,nginx-request-logging,900.532029,True,0.4,True,900.532029 +eadedfe7-471b-4113-b853-13d373ac303a,grok-code-fast-1,xai,fix-git,7396,1931,9327,199.538043,False,0.0,grok-code-fast-1,fix-git,199.538043,False,0.2,False,199.538043 +6c2f19d7-baac-4cbe-8e8b-5c7baa11ffc3,OpenAI/gpt-oss-20B,together_ai,run-pdp11-code,368,2159,2527,85.666112,False,0.0,OpenAI/gpt-oss-20B,run-pdp11-code,85.666112,False,0.0,False,85.666112 +d31531be-74a4-41fe-8d73-2d6d2065482c,grok-code-fast-1,xai,model-extraction-relu-logits,1378,905,2283,151.89274,False,0.0,grok-code-fast-1,model-extraction-relu-logits,151.89274,False,0.0,False,151.89274 +eb30c74b-1c11-4009-b244-0677bdd2ca51,OpenAI/gpt-oss-20B,together_ai,fix-ocaml-gc,230,1247,1477,197.872133,False,0.0,OpenAI/gpt-oss-20B,fix-ocaml-gc,197.872133,False,0.0,False,197.872133 
+8729d83e-2e4c-47af-9e5e-6af1b56cdce6,gemini-2.5-flash,gemini,hf-model-inference,2734,2335,5069,200.120874,False,0.0,gemini-2.5-flash,hf-model-inference,200.120874,False,0.6,False,200.120874 +2d23f238-75a0-4324-a18b-2f4a99a3918d,gpt-5,openai,sqlite-db-truncate,6252,4894,11146,859.7268,False,0.0,gpt-5,sqlite-db-truncate,859.7268,False,0.0,False,859.7268 +2fdd92d7-8a94-49c1-afe2-96efcf838124,openai/gpt-oss-120b,together_ai,db-wal-recovery,7134,16943,24077,900.433352,False,0.0,openai/gpt-oss-120b,db-wal-recovery,900.433352,False,0.0,False,900.433352 +0f6ed156-2a7c-4e1b-8af3-130ee219fca8,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-pmars,17120,5991,23111,773.995493,True,1.0,moonshotai/Kimi-K2-Instruct-0905,build-pmars,773.995493,True,0.8,True,773.995493 +1054c334-ecb1-4b78-a16a-47f17890bc15,gpt-5-mini,openai,nginx-request-logging,4066,1723,5789,130.411973,False,0.0,gpt-5-mini,nginx-request-logging,130.411973,False,0.4,False,130.411973 +4e597b9a-c5ef-4b59-8223-5e86513af6fb,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,write-compressor,7407,6440,13847,946.012866,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,write-compressor,946.012866,False,0.0,False,946.012866 +11011d35-bc84-4e16-8968-39f29c8348e1,gpt-5,openai,path-tracing-reverse,7616,3365,10981,440.426682,False,0.0,gpt-5,path-tracing-reverse,440.426682,False,0.0,False,440.426682 +64931b53-228e-46a7-aa3a-1526a1b8d21a,OpenAI/gpt-oss-20B,together_ai,install-windows-3.11,6726,7056,13782,186.712339,False,0.0,OpenAI/gpt-oss-20B,install-windows-3.11,186.712339,False,0.0,False,186.712339 +1a30ce31-6524-4788-b1d4-39553d21138a,gemini-2.5-pro,gemini,extract-elf,7823,1835,9658,281.684665,False,0.0,gemini-2.5-pro,extract-elf,281.684665,False,0.0,False,281.684665 +8bbabfb2-264b-4fae-9d0e-133db184896b,gpt-5,openai,wasm-pipeline,5179,4558,9737,171.387898,True,1.0,gpt-5,wasm-pipeline,171.387898,True,1.0,True,171.387898 
+1d6e26a9-bf0f-413d-ab38-9145a37eb8a8,grok-code-fast-1,xai,pytorch-model-cli,4611,1450,6061,158.553553,False,0.0,grok-code-fast-1,pytorch-model-cli,158.553553,False,0.0,False,158.553553 +95b1447f-94af-44e4-bf0e-2d3c1e93f571,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,code-from-image,8429,5333,13762,626.83562,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,code-from-image,626.83562,False,0.2,False,626.83562 +f9f68cdd-0841-42d5-9e3e-d98afcbd13a7,gpt-5-nano,openai,qemu-alpine-ssh,3531,5188,8719,902.626363,False,0.0,gpt-5-nano,qemu-alpine-ssh,902.626363,False,0.0,False,902.626363 +d778b3e1-fea8-4591-85c5-1c5e30b77431,claude-opus-4-1-20250805,anthropic,mteb-leaderboard,1554,1342,2896,202.93684,False,0.0,claude-opus-4-1-20250805,mteb-leaderboard,202.93684,False,0.0,False,202.93684 +af25f61f-d195-4b62-a981-5f9578096df8,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,path-tracing-reverse,2727,3008,5735,210.439191,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,path-tracing-reverse,210.439191,False,0.0,False,210.439191 +1bc493ca-b967-454b-810a-8e4ea750c986,claude-opus-4-1-20250805,anthropic,qemu-startup,2761,3324,6085,593.711255,True,1.0,claude-opus-4-1-20250805,qemu-startup,593.711255,True,0.4285714285714285,True,593.711255 +71c7f1e5-b7e4-429c-b9bf-44731d4e12f0,moonshotai/Kimi-K2-Instruct-0905,together_ai,code-from-image,8417,4376,12793,407.311086,True,1.0,moonshotai/Kimi-K2-Instruct-0905,code-from-image,407.311086,True,0.6,True,407.311086 +2fbed525-2d74-40bb-8b93-e42bfebbb3ec,claude-sonnet-4-20250514,anthropic,regex-log,3507,3057,6564,238.051022,True,1.0,claude-sonnet-4-20250514,regex-log,238.051022,True,0.8,True,238.051022 +5f2aef4b-b0b8-4748-9fe2-300b50550ede,claude-opus-4-1-20250805,anthropic,regex-log,2434,2317,4751,128.282453,False,0.0,claude-opus-4-1-20250805,regex-log,128.282453,False,0.5714285714285714,False,128.282453 
+90ddfb49-9480-4d32-8da1-4ef6dfb95e4b,OpenAI/gpt-oss-20B,together_ai,openssl-selfsigned-cert,1789,1077,2866,31.62658,True,1.0,OpenAI/gpt-oss-20B,openssl-selfsigned-cert,31.62658,True,0.2,True,31.62658 +83f1cb26-954b-4f4e-a648-7e09fd2f6e7f,gpt-5-nano,openai,run-pdp11-code,13690,4947,18637,1021.511765,False,0.0,gpt-5-nano,run-pdp11-code,1021.511765,False,0.0,False,1021.511765 +9a8b20b6-24d5-4e60-b57b-390e8230ab1a,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,feal-linear-cryptanalysis,22965,21057,44022,1819.064592,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,feal-linear-cryptanalysis,1819.064592,False,0.0,False,1819.064592 +a3a0c9e8-d57a-4abd-96a8-fb603013966b,gpt-5,openai,sqlite-db-truncate,5162,4227,9389,345.961631,False,0.0,gpt-5,sqlite-db-truncate,345.961631,False,0.0,False,345.961631 +6376dd52-f3f3-4d29-92eb-999aa68b0584,deepseek-ai/DeepSeek-V3.1,together_ai,pypi-server,3908,2465,6373,144.712043,True,1.0,deepseek-ai/DeepSeek-V3.1,pypi-server,144.712043,True,0.4,True,144.712043 +bbd20cd8-d85d-4209-aa0e-7f903574c031,gpt-5-nano,openai,dna-assembly,12114,16132,28246,749.742164,False,0.0,gpt-5-nano,dna-assembly,749.742164,False,0.0,False,749.742164 +2ee94be4-7881-45ac-a7a1-41a61464b228,claude-opus-4-1-20250805,anthropic,write-compressor,13380,9224,22604,911.137481,False,0.0,claude-opus-4-1-20250805,write-compressor,911.137481,False,0.0,False,911.137481 +14de5547-a198-4697-8d0d-c151112df426,openai/gpt-oss-120b,together_ai,mteb-retrieve,1927,762,2689,90.518879,False,0.0,openai/gpt-oss-120b,mteb-retrieve,90.518879,False,0.0,False,90.518879 +dcbf2602-8b4b-4bda-a165-cdeaa56bf48f,gemini-2.5-flash,gemini,merge-diff-arc-agi-task,10965,5959,16924,593.534303,False,0.0,gemini-2.5-flash,merge-diff-arc-agi-task,593.534303,False,0.0,False,593.534303 +126658b8-b075-40a4-b379-221579a64bcc,openai/gpt-oss-120b,together_ai,build-initramfs-qemu,2603,2754,5357,303.618472,False,0.0,openai/gpt-oss-120b,build-initramfs-qemu,303.618472,False,0.0,False,303.618472 
+2bb85130-9b8f-45fb-a35d-d8f8b6c0f1de,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,configure-git-webserver,10090,6556,16646,627.071429,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,configure-git-webserver,627.071429,False,0.6,False,627.071429 +8e1c2727-a184-4e68-ba6e-58e6a218776b,gpt-5-nano,openai,log-summary-date-ranges,2360,1815,4175,160.143288,False,0.0,gpt-5-nano,log-summary-date-ranges,160.143288,False,0.0,False,160.143288 +e903a8f8-0616-4a61-8bcd-e9b1243ead70,gpt-5,openai,nginx-request-logging,3452,1030,4482,287.752694,True,1.0,gpt-5,nginx-request-logging,287.752694,True,1.0,True,287.752694 +c35a1676-903b-406e-af91-f0375f114072,OpenAI/gpt-oss-20B,together_ai,install-windows-3.11,3136,595,3731,39.093198,False,0.0,OpenAI/gpt-oss-20B,install-windows-3.11,39.093198,False,0.0,False,39.093198 +e21d5e09-1e84-4f46-ba25-82c475a5254e,deepseek-ai/DeepSeek-V3.1,together_ai,count-dataset-tokens,13392,4657,18049,741.614968,False,0.0,deepseek-ai/DeepSeek-V3.1,count-dataset-tokens,741.614968,False,0.0,False,741.614968 +36635844-4c1b-4cf2-a891-30393acca1bc,gpt-5-nano,openai,train-fasttext,14014,14333,28347,3600.692619,False,0.0,gpt-5-nano,train-fasttext,3600.692619,False,0.0,False,3600.692619 +d7af17dd-2c83-4d4e-9f5d-db12d7fe76db,gpt-5-mini,openai,cobol-modernization,6779,3569,10348,348.578684,True,1.0,gpt-5-mini,cobol-modernization,348.578684,True,1.0,True,348.578684 +8ef8fa0d-989d-45b0-a3f5-4b1a1a3eabcf,gemini-2.5-flash,gemini,dna-assembly,3958,3144,7102,337.615446,False,0.0,gemini-2.5-flash,dna-assembly,337.615446,False,0.0,False,337.615446 +9e365c1e-fc30-4efe-8a9f-867caa971807,grok-code-fast-1,xai,build-pov-ray,21368,7097,28465,2571.284066,False,0.0,grok-code-fast-1,build-pov-ray,2571.284066,False,0.2,False,2571.284066 +34d09eb7-be5c-4b41-8823-ac82595bd8bb,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-pmars,15643,5765,21408,669.615436,True,1.0,moonshotai/Kimi-K2-Instruct-0905,build-pmars,669.615436,True,0.8,True,669.615436 
+8bf118f7-ad47-44a6-a584-5b16a67c7ccf,moonshotai/Kimi-K2-Instruct-0905,together_ai,hf-model-inference,6506,4606,11112,403.607774,False,0.0,moonshotai/Kimi-K2-Instruct-0905,hf-model-inference,403.607774,False,0.0,False,403.607774 +c8a589b7-1969-40cb-8acd-4a92970a856d,grok-4-0709,xai,build-initramfs-qemu,4090,3343,7433,913.24577,False,0.0,grok-4-0709,build-initramfs-qemu,913.24577,False,0.0,False,913.24577 +7f803f68-3bc2-4887-8159-f1d65b547847,gemini-2.5-pro,gemini,pytorch-model-recovery,9591,5529,15120,874.427811,True,1.0,gemini-2.5-pro,pytorch-model-recovery,874.427811,True,1.0,True,874.427811 +de054569-f5c4-4dca-b603-d3982af0c590,gemini-2.5-flash,gemini,code-from-image,1456,1051,2507,157.591857,False,0.0,gemini-2.5-flash,code-from-image,157.591857,False,0.4,False,157.591857 +524f65d5-7371-4411-af61-8677b044a050,claude-sonnet-4-20250514,anthropic,sqlite-with-gcov,13154,3799,16953,773.164517,False,0.0,claude-sonnet-4-20250514,sqlite-with-gcov,773.164517,False,0.2,False,773.164517 +1a70ae1a-a9e7-428c-a762-8ef33b77657b,gpt-5-mini,openai,gpt2-codegolf,1377,1040,2417,238.689972,False,0.0,gpt-5-mini,gpt2-codegolf,238.689972,False,0.0,False,238.689972 +734e3d25-3eb1-4c32-8619-dc372f72e124,gemini-2.5-pro,gemini,polyglot-c-py,1446,1279,2725,90.301479,False,0.0,gemini-2.5-pro,polyglot-c-py,90.301479,False,0.2,False,90.301479 +366b9c98-329c-48a9-91dd-1cebf50935fc,openai/gpt-oss-120b,together_ai,video-processing,1669,988,2657,75.652025,False,0.0,openai/gpt-oss-120b,video-processing,75.652025,False,0.0,False,75.652025 +2b0b634a-4a78-46d9-bbd5-62dc9b0efc36,claude-opus-4-1-20250805,anthropic,qemu-alpine-ssh,2409,2462,4871,287.888495,True,1.0,claude-opus-4-1-20250805,qemu-alpine-ssh,287.888495,True,0.8571428571428571,True,287.888495 +f7fa1c4c-d940-4b04-b3c8-5186d91383e3,claude-opus-4-1-20250805,anthropic,break-filter-js-from-html,10490,9299,19789,1038.054024,True,1.0,claude-opus-4-1-20250805,break-filter-js-from-html,1038.054024,True,0.2222222222222222,True,1038.054024 
+d564e1c7-5dd3-47f3-8f3f-040ebdf8350d,moonshotai/Kimi-K2-Instruct-0905,together_ai,pytorch-model-recovery,7320,5777,13097,901.315843,False,0.0,moonshotai/Kimi-K2-Instruct-0905,pytorch-model-recovery,901.315843,False,0.4,False,901.315843 +0612a6b7-c7a4-4478-873b-d3d8a36c0905,claude-opus-4-1-20250805,anthropic,polyglot-c-py,3347,2567,5914,232.122145,False,0.0,claude-opus-4-1-20250805,polyglot-c-py,232.122145,False,0.0,False,232.122145 +b60b1632-07b4-4154-ab1f-ce7b6b812d03,OpenAI/gpt-oss-20B,together_ai,pytorch-model-recovery,2217,13429,15646,915.069511,False,0.0,OpenAI/gpt-oss-20B,pytorch-model-recovery,915.069511,False,0.0,False,915.069511 +5a203e45-b3c1-4c5e-a44c-968966050856,gpt-5-nano,openai,sanitize-git-repo,14111,7238,21349,900.283965,False,0.0,gpt-5-nano,sanitize-git-repo,900.283965,False,0.0,False,900.283965 +ab4fff6e-2999-43c2-9776-726b1efa65c2,gpt-5-mini,openai,crack-7z-hash,2048,770,2818,87.18888,False,0.0,gpt-5-mini,crack-7z-hash,87.18888,False,0.0,False,87.18888 +ffc9fe52-e07e-4726-a42a-94151ebf1e33,claude-opus-4-1-20250805,anthropic,large-scale-text-editing,5771,4440,10211,460.53846,True,1.0,claude-opus-4-1-20250805,large-scale-text-editing,460.53846,True,0.6666666666666666,True,460.53846 +d8c266c5-877c-471c-a8ae-9ac1335dc80a,openai/gpt-oss-120b,together_ai,torch-tensor-parallelism,2063,1443,3506,78.420052,False,0.0,openai/gpt-oss-120b,torch-tensor-parallelism,78.420052,False,0.0,False,78.420052 +4950fe5c-3af4-45d7-a081-14d6a0e07d4c,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,prove-plus-comm,2574,3022,5596,918.028176,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,prove-plus-comm,918.028176,False,0.2,False,918.028176 +ed55c741-b0d2-4367-84f1-9d4083274d72,grok-4-0709,xai,build-pov-ray,19781,6141,25922,1766.543346,True,1.0,grok-4-0709,build-pov-ray,1766.543346,True,1.0,True,1766.543346 
+275e8b82-891d-46de-a580-68ca4def2ee8,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,path-tracing,2835,2214,5049,273.046074,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,path-tracing,273.046074,False,0.0,False,273.046074 +735c598a-47dd-4a40-a38b-f6951de5eb81,gpt-5-mini,openai,sanitize-git-repo,0,0,0,1002.411864,False,0.0,gpt-5-mini,sanitize-git-repo,1002.411864,False,0.0,False,1002.411864 +21e9f546-dc34-449a-8163-6f1fa434b641,gpt-5-mini,openai,dna-insert,964,2813,3777,387.555517,False,0.0,gpt-5-mini,dna-insert,387.555517,False,0.0,False,387.555517 +867b8355-51c6-448c-ab85-dd6c5f60f3c9,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,nginx-request-logging,6268,3807,10075,559.022787,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,nginx-request-logging,559.022787,False,0.4,False,559.022787 +688b62d2-8ddc-487e-b255-1b7c21b5d432,claude-sonnet-4-20250514,anthropic,build-pov-ray,19516,8156,27672,1843.132151,True,1.0,claude-sonnet-4-20250514,build-pov-ray,1843.132151,True,0.6,True,1843.132151 +7ac78740-c58b-4094-9c33-f21ac74c901c,gpt-5-nano,openai,password-recovery,3080,7124,10204,904.616632,False,0.0,gpt-5-nano,password-recovery,904.616632,False,0.0,False,904.616632 +e126aa9a-08cc-4aa1-bd15-81c5bcf483d4,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,train-fasttext,7636,3016,10652,495.528503,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,train-fasttext,495.528503,False,0.0,False,495.528503 +1e54ae00-bb5c-4ff1-b6d5-9909abe6e526,zai-org/GLM-4.5-Air-FP8,together_ai,merge-diff-arc-agi-task,21219,9898,31117,468.390265,False,0.0,zai-org/GLM-4.5-Air-FP8,merge-diff-arc-agi-task,468.390265,False,0.0,False,468.390265 +b2b6071d-00c1-4a2d-b8d9-b9749eb1470c,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,video-processing,2470,1694,4164,742.73969,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,video-processing,742.73969,False,0.0,False,742.73969 
+6c696321-e0b5-4a3d-8b7f-76898e5d6557,zai-org/GLM-4.5-Air-FP8,together_ai,password-recovery,4896,6944,11840,901.521805,False,0.0,zai-org/GLM-4.5-Air-FP8,password-recovery,901.521805,False,0.0,False,901.521805 +c132e1d5-f324-44eb-b955-54d601713052,gemini-2.5-flash,gemini,count-dataset-tokens,8100,3598,11698,303.303175,False,0.0,gemini-2.5-flash,count-dataset-tokens,303.303175,False,0.0,False,303.303175 +448fc72d-8763-484e-ac7e-ca04df78b9f2,OpenAI/gpt-oss-20B,together_ai,largest-eigenval,177,242,419,87.474697,False,0.0,OpenAI/gpt-oss-20B,largest-eigenval,87.474697,False,0.0,False,87.474697 +48158799-107d-421b-b34e-02fa5a8d38c5,OpenAI/gpt-oss-20B,together_ai,cancel-async-tasks,1378,729,2107,47.596013,False,0.0,OpenAI/gpt-oss-20B,cancel-async-tasks,47.596013,False,0.0,False,47.596013 +a84efdf1-6156-4caa-b18e-69f177573f3e,grok-code-fast-1,xai,hf-model-inference,3823,1215,5038,212.010365,False,0.0,grok-code-fast-1,hf-model-inference,212.010365,False,0.4,False,212.010365 +7beb5a4b-0a7e-4103-a813-40514f0b6da6,gpt-5,openai,regex-log,1716,1176,2892,238.699203,True,1.0,gpt-5,regex-log,238.699203,True,1.0,True,238.699203 +4e265d2e-cc3c-4f7f-8686-c594eaf39f70,OpenAI/gpt-oss-20B,together_ai,torch-tensor-parallelism,926,1346,2272,113.232244,False,0.0,OpenAI/gpt-oss-20B,torch-tensor-parallelism,113.232244,False,0.0,False,113.232244 +b7338317-329c-4329-a0a5-92c844ba3ec8,gpt-5-mini,openai,reshard-c4-data,6848,7792,14640,784.104237,False,0.0,gpt-5-mini,reshard-c4-data,784.104237,False,0.0,False,784.104237 +4d33822f-dd89-4688-b02b-ad502a70b8f4,deepseek-ai/DeepSeek-V3.1,together_ai,regex-log,1507,1033,2540,170.801851,False,0.0,deepseek-ai/DeepSeek-V3.1,regex-log,170.801851,False,0.2,False,170.801851 +cd8e5bda-3f26-41cb-a107-1c5930e29bbc,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,qemu-alpine-ssh,4297,2288,6585,293.417581,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,qemu-alpine-ssh,293.417581,False,0.0,False,293.417581 
+3e855e2b-0bdf-4f53-9db2-804d20315d0b,OpenAI/gpt-oss-20B,together_ai,make-doom-for-mips,2928,12285,15213,903.622876,False,0.0,OpenAI/gpt-oss-20B,make-doom-for-mips,903.622876,False,0.0,False,903.622876 +37eb3b9c-c908-48ed-9ed6-295e94dc022c,gemini-2.5-flash,gemini,password-recovery,3686,6686,10372,900.023634,False,0.0,gemini-2.5-flash,password-recovery,900.023634,False,0.0,False,900.023634 +9caadcea-65e0-46c4-a4b6-7cd8b1bca2ed,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,feal-differential-cryptanalysis,4885,4378,9263,2458.036714,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,feal-differential-cryptanalysis,2458.036714,False,0.0,False,2458.036714 +9ea7eb98-e1a0-458a-a270-fae9c246ab5e,gpt-5-mini,openai,path-tracing,22901,19614,42515,1555.892007,False,0.0,gpt-5-mini,path-tracing,1555.892007,False,0.0,False,1555.892007 +3fcff4d2-19a0-40ed-8ffd-2e7a86783840,claude-opus-4-1-20250805,anthropic,fix-ocaml-gc,44242,21134,65376,3681.242939,False,0.0,claude-opus-4-1-20250805,fix-ocaml-gc,3681.242939,False,0.5,False,3681.242939 +a9e1875e-b84d-47de-9f50-f60cbaff12ad,deepseek-ai/DeepSeek-V3.1,together_ai,count-dataset-tokens,13664,3056,16720,919.91295,False,0.0,deepseek-ai/DeepSeek-V3.1,count-dataset-tokens,919.91295,False,0.0,False,919.91295 +59473358-544b-4863-9c1a-1abb1bfebab5,deepseek-ai/DeepSeek-V3.1,together_ai,build-cython-ext,13164,4373,17537,906.657237,False,0.0,deepseek-ai/DeepSeek-V3.1,build-cython-ext,906.657237,False,0.0,False,906.657237 +207b7983-33b7-4300-a546-111d3aaeda87,claude-sonnet-4-20250514,anthropic,cobol-modernization,6991,5678,12669,640.959331,True,1.0,claude-sonnet-4-20250514,cobol-modernization,640.959331,True,1.0,True,640.959331 +428be7b3-6c27-44ad-8e77-08cdf281d012,OpenAI/gpt-oss-20B,together_ai,feal-linear-cryptanalysis,6047,19474,25521,1848.56029,False,0.0,OpenAI/gpt-oss-20B,feal-linear-cryptanalysis,1848.56029,False,0.0,False,1848.56029 
+69b2f840-f461-4cc1-94e7-276ef22ba627,gemini-2.5-pro,gemini,schemelike-metacircular-eval,19986,29001,48987,1263.391927,False,0.0,gemini-2.5-pro,schemelike-metacircular-eval,1263.391927,False,0.0,False,1263.391927 +fcc48f6a-b8e3-470d-a3a8-e81424264169,gpt-5-nano,openai,pypi-server,6707,4552,11259,422.243813,True,1.0,gpt-5-nano,pypi-server,422.243813,True,0.8,True,422.243813 +e3a685c1-c023-4dca-a60b-83cd5c93342c,claude-sonnet-4-20250514,anthropic,winning-avg-corewars,13636,13338,26974,1086.853986,False,0.0,claude-sonnet-4-20250514,winning-avg-corewars,1086.853986,False,0.0,False,1086.853986 +51b8307e-370c-41c4-93be-ff181fecbe67,claude-sonnet-4-20250514,anthropic,merge-diff-arc-agi-task,12241,5028,17269,901.14175,False,0.0,claude-sonnet-4-20250514,merge-diff-arc-agi-task,901.14175,False,0.0,False,901.14175 +2260edc0-cc3b-4806-8f25-aa0efdb85130,gpt-5-nano,openai,build-initramfs-qemu,802,977,1779,96.907217,False,0.0,gpt-5-nano,build-initramfs-qemu,96.907217,False,0.0,False,96.907217 +b2072ee7-71b9-4ff6-a7fd-c3c994739765,claude-opus-4-1-20250805,anthropic,build-cython-ext,15838,4630,20468,906.73594,False,0.0,claude-opus-4-1-20250805,build-cython-ext,906.73594,False,0.0,False,906.73594 +7e1914a3-f12e-4639-851d-a4293f6350ac,OpenAI/gpt-oss-20B,together_ai,tune-mjcf,2915,11336,14251,901.769956,False,0.0,OpenAI/gpt-oss-20B,tune-mjcf,901.769956,False,0.0,False,901.769956 +4988957b-82fd-4bd5-979e-309eefc512b4,gemini-2.5-pro,gemini,build-pov-ray,21858,7656,29514,1672.216476,True,1.0,gemini-2.5-pro,build-pov-ray,1672.216476,True,1.0,True,1672.216476 +2111477c-5a7b-4738-9125-399df8e29567,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,install-klee-minimal,11657,4130,15787,907.342612,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,install-klee-minimal,907.342612,False,0.0,False,907.342612 
+b6271fa9-0d5f-4238-84a7-888844ca4a1f,gpt-5,openai,nginx-request-logging,5012,1633,6645,180.570738,True,1.0,gpt-5,nginx-request-logging,180.570738,True,1.0,True,180.570738 +68198567-c72b-4ae6-8ce0-1fbf5a6ac135,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,large-scale-text-editing,5047,5481,10528,1211.410911,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,large-scale-text-editing,1211.410911,False,0.0,False,1211.410911 +6730bc51-36f3-4a1a-b59c-c60bfc78b64f,moonshotai/Kimi-K2-Instruct-0905,together_ai,configure-git-webserver,6244,2720,8964,915.02036,False,0.0,moonshotai/Kimi-K2-Instruct-0905,configure-git-webserver,915.02036,False,0.6,False,915.02036 +7daac61f-ef7f-4e79-899d-002f4b720853,claude-opus-4-1-20250805,anthropic,adaptive-rejection-sampler,15880,13728,29608,900.000748,True,1.0,claude-opus-4-1-20250805,adaptive-rejection-sampler,900.000748,True,0.125,True,900.000748 +61cef84b-cbbd-4dc2-a0f4-9bb24abb4beb,gemini-2.5-pro,gemini,gpt2-codegolf,5377,4961,10338,697.547094,False,0.0,gemini-2.5-pro,gpt2-codegolf,697.547094,False,0.0,False,697.547094 +639d9c82-f31c-480c-9096-f6e05b2e7cfa,deepseek-ai/DeepSeek-V3.1,together_ai,crack-7z-hash,9292,3554,12846,337.754947,True,1.0,deepseek-ai/DeepSeek-V3.1,crack-7z-hash,337.754947,True,0.8,True,337.754947 +c38990ca-d8d7-4995-9f45-0d9a0cc2a2e6,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,git-leak-recovery,2558,2039,4597,173.514018,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,git-leak-recovery,173.514018,True,1.0,True,173.514018 +9c1ede3e-f4ae-426d-a6a0-be7be1d2816d,claude-opus-4-1-20250805,anthropic,dna-assembly,13712,8976,22688,285.310443,False,0.0,claude-opus-4-1-20250805,dna-assembly,285.310443,False,0.0,False,285.310443 +97915e07-1d7f-451b-b269-19cd05f766ea,claude-opus-4-1-20250805,anthropic,reverse-engineering,20321,15044,35365,1800.238053,False,0.0,claude-opus-4-1-20250805,reverse-engineering,1800.238053,False,0.0,False,1800.238053 
+1d1a0003-1f74-4815-81f9-6c945bc39b7b,grok-4-0709,xai,crack-7z-hash,11585,3109,14694,900.02668,False,0.0,grok-4-0709,crack-7z-hash,900.02668,False,0.8,False,900.02668 +5d0ac4c3-8c0f-489f-ab07-d061377af674,zai-org/GLM-4.5-Air-FP8,together_ai,video-processing,3330,3101,6431,191.889484,False,0.0,zai-org/GLM-4.5-Air-FP8,video-processing,191.889484,False,0.0,False,191.889484 +566480d3-98cd-4f9b-a645-c9fb05491b44,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,fix-git,5731,2953,8684,495.622287,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,fix-git,495.622287,True,1.0,True,495.622287 +57e53842-e0e2-42a3-a262-7b131a3ea3d3,openai/gpt-oss-120b,together_ai,financial-document-processor,8364,3443,11807,287.284738,False,0.0,openai/gpt-oss-120b,financial-document-processor,287.284738,False,0.0,False,287.284738 +a46e4b00-776a-41de-82f2-681a009a697f,claude-opus-4-1-20250805,anthropic,largest-eigenval,16982,11458,28440,902.021514,True,1.0,claude-opus-4-1-20250805,largest-eigenval,902.021514,True,0.25,True,902.021514 +df842bec-2878-45f0-a123-7a8a5132dd70,claude-opus-4-1-20250805,anthropic,winning-avg-corewars,53650,48266,101916,3628.171085,False,0.0,claude-opus-4-1-20250805,winning-avg-corewars,3628.171085,False,0.3333333333333333,False,3628.171085 +d84a0485-ebfb-4fc4-ba22-1b893f5e9839,gpt-5-mini,openai,git-leak-recovery,6269,6695,12964,919.619248,False,0.0,gpt-5-mini,git-leak-recovery,919.619248,False,0.0,False,919.619248 +776ea66e-ef0f-4154-9bb4-d3894c794198,claude-sonnet-4-20250514,anthropic,vulnerable-secret,7832,9490,17322,900.147484,False,0.0,claude-sonnet-4-20250514,vulnerable-secret,900.147484,False,0.0,False,900.147484 +571ec257-dd9d-4d7f-8c59-f083668a729c,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,fix-ocaml-gc,18894,7849,26743,1415.570426,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,fix-ocaml-gc,1415.570426,False,0.0,False,1415.570426 
+629b43e9-8e89-4f34-9004-6784580e5a67,gpt-5-nano,openai,install-klee-minimal,5527,3120,8647,900.000366,False,0.0,gpt-5-nano,install-klee-minimal,900.000366,False,0.0,False,900.000366 +07014b77-ca2a-49a1-853e-6a308973fa3c,claude-sonnet-4-20250514,anthropic,build-pmars,6296,1743,8039,2066.811023,False,0.0,claude-sonnet-4-20250514,build-pmars,2066.811023,False,0.6,False,2066.811023 +b863236d-e4ad-4172-87df-cf19becc41e8,gpt-5-mini,openai,schemelike-metacircular-eval,30106,37691,67797,2424.501503,False,0.0,gpt-5-mini,schemelike-metacircular-eval,2424.501503,False,0.0,False,2424.501503 +a39fa129-34d9-4c90-b6da-8f3ea4f94b0f,zai-org/GLM-4.5-Air-FP8,together_ai,sanitize-git-repo,12329,8245,20574,468.935086,False,0.0,zai-org/GLM-4.5-Air-FP8,sanitize-git-repo,468.935086,False,0.0,False,468.935086 +b4d29457-fa80-4b77-80e9-3d24f20b1deb,gemini-2.5-flash,gemini,password-recovery,2753,6001,8754,674.968792,False,0.0,gemini-2.5-flash,password-recovery,674.968792,False,0.0,False,674.968792 +deaee93e-694c-4911-bf71-32e8ba278a59,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,winning-avg-corewars,16591,11198,27789,1622.418055,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,winning-avg-corewars,1622.418055,False,0.0,False,1622.418055 +ee769c80-10c2-4044-b47f-7dba3b045a17,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,make-doom-for-mips,16320,3314,19634,919.006607,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,make-doom-for-mips,919.006607,False,0.0,False,919.006607 +d58cf7c7-1b18-4476-a66d-cd11b5ec9cd6,openai/gpt-oss-120b,together_ai,gpt2-codegolf,2146,6068,8214,490.102273,False,0.0,openai/gpt-oss-120b,gpt2-codegolf,490.102273,False,0.0,False,490.102273 +2d59f02d-79d7-4769-89dd-50f34083e522,OpenAI/gpt-oss-20B,together_ai,mteb-leaderboard,924,234,1158,97.476365,False,0.0,OpenAI/gpt-oss-20B,mteb-leaderboard,97.476365,False,0.0,False,97.476365 
+9965d685-d878-4b90-88ea-70d1a885c6ca,claude-opus-4-1-20250805,anthropic,pytorch-model-cli,6511,4649,11160,191.97382,True,1.0,claude-opus-4-1-20250805,pytorch-model-cli,191.97382,True,0.4285714285714285,True,191.97382 +226ef884-f95c-4bcd-9819-5af4b59e1761,OpenAI/gpt-oss-20B,together_ai,video-processing,906,1508,2414,73.400203,False,0.0,OpenAI/gpt-oss-20B,video-processing,73.400203,False,0.0,False,73.400203 +eec40351-5054-4e5d-97df-533199651f11,gemini-2.5-flash,gemini,qemu-alpine-ssh,2913,2994,5907,302.902164,False,0.0,gemini-2.5-flash,qemu-alpine-ssh,302.902164,False,0.0,False,302.902164 +38b13cb1-e61d-4bd8-9b43-74c953ab9a22,claude-sonnet-4-20250514,anthropic,build-cython-ext,14795,5168,19963,900.001076,False,0.0,claude-sonnet-4-20250514,build-cython-ext,900.001076,False,0.0,False,900.001076 +edc946cf-9f32-47dc-82bf-06aeac0a763d,claude-opus-4-1-20250805,anthropic,feal-linear-cryptanalysis,14443,20693,35136,1800.225201,False,0.0,claude-opus-4-1-20250805,feal-linear-cryptanalysis,1800.225201,False,0.0,False,1800.225201 +09c22d0b-f237-40c9-9152-4aebe9883106,OpenAI/gpt-oss-20B,together_ai,polyglot-rust-c,222,1735,1957,115.479496,False,0.0,OpenAI/gpt-oss-20B,polyglot-rust-c,115.479496,False,0.0,False,115.479496 +9f4fd13d-98f2-4b1d-95e5-a5b3141c2bde,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,polyglot-c-py,3825,2409,6234,72.777524,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,polyglot-c-py,72.777524,False,0.0,False,72.777524 +257d5b40-f86a-4c2b-be54-78e1215ab6b9,zai-org/GLM-4.5-Air-FP8,together_ai,circuit-fibsqrt,25548,50400,75948,2126.641662,False,0.0,zai-org/GLM-4.5-Air-FP8,circuit-fibsqrt,2126.641662,False,0.0,False,2126.641662 +31abb7ed-a7dd-4710-ae5e-767265e5c6e9,gemini-2.5-pro,gemini,db-wal-recovery,4271,3434,7705,462.198917,False,0.0,gemini-2.5-pro,db-wal-recovery,462.198917,False,0.0,False,462.198917 
+de6ed5ff-979b-4f3c-99af-c85672494188,claude-sonnet-4-20250514,anthropic,chess-best-move,6684,5477,12161,182.596906,False,0.0,claude-sonnet-4-20250514,chess-best-move,182.596906,False,0.0,False,182.596906 +b09d1d86-61a0-4f16-be74-d1683d6bc58d,claude-sonnet-4-20250514,anthropic,make-doom-for-mips,22083,6282,28365,905.482606,False,0.0,claude-sonnet-4-20250514,make-doom-for-mips,905.482606,False,0.0,False,905.482606 +7f59c512-03fe-4737-9774-375f98faaf12,claude-opus-4-1-20250805,anthropic,make-doom-for-mips,20328,6042,26370,906.140076,False,0.0,claude-opus-4-1-20250805,make-doom-for-mips,906.140076,False,0.0,False,906.140076 +27434c92-02fc-44e2-bc19-28c830395c9b,grok-code-fast-1,xai,winning-avg-corewars,3983,1109,5092,107.45215,False,0.0,grok-code-fast-1,winning-avg-corewars,107.45215,False,0.0,False,107.45215 +661c1ce4-03fd-4b3c-b569-a8214bb66519,gpt-5,openai,feal-linear-cryptanalysis,17771,13578,31349,1413.234163,True,1.0,gpt-5,feal-linear-cryptanalysis,1413.234163,True,1.0,True,1413.234163 +3db7084b-51c4-4a32-831b-8e7fb7b7d3e7,claude-sonnet-4-20250514,anthropic,circuit-fibsqrt,14181,15368,29549,1484.809645,False,0.0,claude-sonnet-4-20250514,circuit-fibsqrt,1484.809645,False,0.0,False,1484.809645 +c930e187-e83f-48c5-a4ca-b9ff889210c8,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,path-tracing,5691,5310,11001,602.096762,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,path-tracing,602.096762,False,0.0,False,602.096762 +9a73c9f9-f9a9-4663-bb81-f19141d6e5c1,moonshotai/Kimi-K2-Instruct-0905,together_ai,pytorch-model-cli,9832,5779,15611,411.493578,False,0.0,moonshotai/Kimi-K2-Instruct-0905,pytorch-model-cli,411.493578,False,0.0,False,411.493578 +d2cc7b3a-fb7f-4e08-ba54-9d0c3c11d2cd,moonshotai/Kimi-K2-Instruct-0905,together_ai,dna-insert,4842,778,5620,360.00195,False,0.0,moonshotai/Kimi-K2-Instruct-0905,dna-insert,360.00195,False,0.0,False,360.00195 
+1091c897-9654-4089-9768-38fc36b93809,gpt-5,openai,nginx-request-logging,4154,1531,5685,197.444026,True,1.0,gpt-5,nginx-request-logging,197.444026,True,1.0,True,197.444026 +38448196-935c-445d-ab11-3e4b713f8da0,gpt-5,openai,large-scale-text-editing,4278,3832,8110,1241.365031,False,0.0,gpt-5,large-scale-text-editing,1241.365031,False,0.4285714285714285,False,1241.365031 +f4b565ee-d020-4275-b01c-2f537519bee1,grok-4-0709,xai,tune-mjcf,3756,2579,6335,929.268954,False,0.0,grok-4-0709,tune-mjcf,929.268954,False,0.0,False,929.268954 +a322daa4-5bd5-44b2-ac24-f699a5301179,OpenAI/gpt-oss-20B,together_ai,cancel-async-tasks,1162,531,1693,15.837117,False,0.0,OpenAI/gpt-oss-20B,cancel-async-tasks,15.837117,False,0.0,False,15.837117 +d4fbfa17-af3b-434f-a6d5-8ab775139c52,gpt-5-mini,openai,regex-log,1551,909,2460,171.2817,True,1.0,gpt-5-mini,regex-log,171.2817,True,0.8,True,171.2817 +5e5bf6ea-c454-4c8c-b20f-aa5e662b6415,gpt-5-mini,openai,fix-git,6490,4134,10624,380.362449,True,1.0,gpt-5-mini,fix-git,380.362449,True,0.6,True,380.362449 +51087244-cf29-421a-aa48-040bb72177c5,openai/gpt-oss-120b,together_ai,fix-git,11067,4631,15698,420.166207,True,1.0,openai/gpt-oss-120b,fix-git,420.166207,True,0.6,True,420.166207 +b90c822e-69ca-49bb-bb60-4d22384970f7,grok-code-fast-1,xai,circuit-fibsqrt,4291,2740,7031,310.520974,False,0.0,grok-code-fast-1,circuit-fibsqrt,310.520974,False,0.0,False,310.520974 +81c631c5-77cd-4231-80df-01857bd8a03d,claude-opus-4-1-20250805,anthropic,cancel-async-tasks,3419,2774,6193,323.441293,False,0.0,claude-opus-4-1-20250805,cancel-async-tasks,323.441293,False,0.125,False,323.441293 +eabd3d58-5bb4-4d58-b80f-845cdd96e3f0,grok-4-0709,xai,fix-ocaml-gc,28394,11796,40190,3600.003152,False,0.0,grok-4-0709,fix-ocaml-gc,3600.003152,False,0.0,False,3600.003152 +d09e362d-8bac-4f15-8c38-aea6f8bb3d68,gpt-5,openai,extract-elf,2576,3127,5703,114.179744,False,0.0,gpt-5,extract-elf,114.179744,False,0.2857142857142857,False,114.179744 
+2604cc6e-eaaa-4f21-856b-452c53472eb6,gemini-2.5-pro,gemini,feal-differential-cryptanalysis,2713,1833,4546,669.841014,True,1.0,gemini-2.5-pro,feal-differential-cryptanalysis,669.841014,True,0.6,True,669.841014 +f7ca3fe2-4ea0-406b-8f53-d01482eb21fe,claude-sonnet-4-20250514,anthropic,constraints-scheduling,6248,3500,9748,290.927141,True,1.0,claude-sonnet-4-20250514,constraints-scheduling,290.927141,True,1.0,True,290.927141 +4a558285-b12b-41a1-b4db-6b634aaabadf,gemini-2.5-pro,gemini,nginx-request-logging,3796,1847,5643,396.030978,False,0.0,gemini-2.5-pro,nginx-request-logging,396.030978,False,0.6,False,396.030978 +66f07cd7-3358-4af9-b076-f2572a615b71,claude-opus-4-1-20250805,anthropic,build-cython-ext,11070,2617,13687,908.751913,False,0.0,claude-opus-4-1-20250805,build-cython-ext,908.751913,False,0.0,False,908.751913 +136f4164-95d3-477b-9baf-e01a4459b77c,gemini-2.5-flash,gemini,git-leak-recovery,1279,1162,2441,131.339016,False,0.0,gemini-2.5-flash,git-leak-recovery,131.339016,False,0.6,False,131.339016 +8f35d819-3c21-453e-b571-88d244f16692,gpt-5,openai,winning-avg-corewars,31508,29368,60876,3621.26844,False,0.0,gpt-5,winning-avg-corewars,3621.26844,False,0.2857142857142857,False,3621.26844 +e1a62e76-4b7c-4a2a-96ce-5be16a5e5084,moonshotai/Kimi-K2-Instruct-0905,together_ai,cancel-async-tasks,2494,1859,4353,896.774426,True,1.0,moonshotai/Kimi-K2-Instruct-0905,cancel-async-tasks,896.774426,True,0.6,True,896.774426 +840a0d3b-6647-4c8f-a6e8-148678c1c146,openai/gpt-oss-120b,together_ai,adaptive-rejection-sampler,8339,7770,16109,902.183438,False,0.0,openai/gpt-oss-120b,adaptive-rejection-sampler,902.183438,False,0.0,False,902.183438 +e44839c0-6f4c-47c7-8fb6-1042c44f9ba7,gpt-5,openai,constraints-scheduling,4424,1816,6240,181.470067,True,1.0,gpt-5,constraints-scheduling,181.470067,True,0.8571428571428571,True,181.470067 
+2c356500-e109-47d1-8d8c-73db20b46c7f,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,log-summary-date-ranges,9553,3549,13102,190.140815,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,log-summary-date-ranges,190.140815,False,0.8,False,190.140815 +502642eb-5cb7-4ed0-8925-7b6914690fb8,claude-opus-4-1-20250805,anthropic,chess-best-move,7848,7376,15224,336.264846,False,0.0,claude-opus-4-1-20250805,chess-best-move,336.264846,False,0.0,False,336.264846 +cae55284-767b-4ebd-86ef-3e06a9b9bbd1,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,nginx-request-logging,3614,2287,5901,126.59226,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,nginx-request-logging,126.59226,False,0.0,False,126.59226 +2185e680-7be3-45a7-b474-e30a7c0d93ed,OpenAI/gpt-oss-20B,together_ai,write-compressor,3748,17598,21346,906.86461,False,0.0,OpenAI/gpt-oss-20B,write-compressor,906.86461,False,0.0,False,906.86461 +e3611a25-15fb-4f34-a966-71e930cfbeab,OpenAI/gpt-oss-20B,together_ai,polyglot-c-py,243,915,1158,105.069729,False,0.0,OpenAI/gpt-oss-20B,polyglot-c-py,105.069729,False,0.0,False,105.069729 +bbfbdd21-7111-4e3c-b5dd-14c472fb6825,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,largest-eigenval,6460,5493,11953,553.179561,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,largest-eigenval,553.179561,False,0.2,False,553.179561 +d9d4c2a0-b05b-47a5-8a87-0c9ae741b314,gpt-5-mini,openai,winning-avg-corewars,18768,11719,30487,3600.046057,False,0.0,gpt-5-mini,winning-avg-corewars,3600.046057,False,0.0,False,3600.046057 +1054b191-da06-4c38-ae19-80558f15013d,gpt-5-nano,openai,mteb-leaderboard,11238,13735,24973,1732.246102,False,0.0,gpt-5-nano,mteb-leaderboard,1732.246102,False,0.0,False,1732.246102 +66404b00-9bee-4340-b1c6-87139906e5f4,openai/gpt-oss-120b,together_ai,make-doom-for-mips,14656,4416,19072,900.074141,False,0.0,openai/gpt-oss-120b,make-doom-for-mips,900.074141,False,0.0,False,900.074141 
+891564a4-b4ae-41c9-8a79-7d93d786baef,openai/gpt-oss-120b,together_ai,tune-mjcf,9498,9856,19354,904.484652,False,0.0,openai/gpt-oss-120b,tune-mjcf,904.484652,False,0.2,False,904.484652 +45321289-eb82-4da9-baf1-67854c074334,grok-4-0709,xai,wasm-pipeline,7611,3506,11117,919.291095,False,0.0,grok-4-0709,wasm-pipeline,919.291095,False,0.4,False,919.291095 +9eb34595-3c66-4ac0-ae58-bc728fa1c68f,grok-4-0709,xai,regex-log,1350,669,2019,235.37137,False,0.0,grok-4-0709,regex-log,235.37137,False,0.6,False,235.37137 +a92e3751-ad7e-4a1a-8155-801e3208f1e0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,log-summary-date-ranges,9419,3837,13256,200.016045,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,log-summary-date-ranges,200.016045,True,0.8,True,200.016045 +ea32f06a-ec71-4e67-957e-8463e4794b2d,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,dna-insert,8664,4507,13171,395.821054,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,dna-insert,395.821054,False,0.0,False,395.821054 +c5382eab-2619-4eab-bcd7-a399476c9e49,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,git-leak-recovery,2287,1530,3817,145.433655,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,git-leak-recovery,145.433655,True,1.0,True,145.433655 +1dbac28f-2e0c-4516-9e2f-460a389c2edf,deepseek-ai/DeepSeek-V3.1,together_ai,gpt2-codegolf,4893,5464,10357,334.100522,False,0.0,deepseek-ai/DeepSeek-V3.1,gpt2-codegolf,334.100522,False,0.0,False,334.100522 +85005041-a156-4014-a23c-38a277c4655b,gemini-2.5-pro,gemini,cobol-modernization,4830,3531,8361,316.468453,True,1.0,gemini-2.5-pro,cobol-modernization,316.468453,True,1.0,True,316.468453 +345e0b57-6323-4dcb-9584-e12f9630348a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-initramfs-qemu,6027,2754,8781,907.695081,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-initramfs-qemu,907.695081,False,0.0,False,907.695081 
+f3d5209f-75c1-469d-a2f2-394a1e52c804,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,schemelike-metacircular-eval,20907,15291,36198,2406.472815,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,schemelike-metacircular-eval,2406.472815,False,0.0,False,2406.472815 +695faf9b-b8af-430e-a571-2a7cf773aa4d,OpenAI/gpt-oss-20B,together_ai,wasm-pipeline,191,1260,1451,154.709775,False,0.0,OpenAI/gpt-oss-20B,wasm-pipeline,154.709775,False,0.0,False,154.709775 +948b46f9-4622-4d42-aaf8-8181f0dc4eb6,claude-sonnet-4-20250514,anthropic,polyglot-c-py,5986,3701,9687,284.25121,False,0.0,claude-sonnet-4-20250514,polyglot-c-py,284.25121,False,0.0,False,284.25121 +5331c57d-b7e2-4004-9bba-8a01fded8bf2,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,db-wal-recovery,2008,1786,3794,152.173643,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,db-wal-recovery,152.173643,False,0.0,False,152.173643 +6ba6f338-43c3-4f33-918e-267177f98468,openai/gpt-oss-120b,together_ai,bn-fit-modify,4701,4057,8758,1834.933602,False,0.0,openai/gpt-oss-120b,bn-fit-modify,1834.933602,False,0.2,False,1834.933602 +23bfc685-cbb6-4c5c-b82e-bc461cb3aa8f,gpt-5-nano,openai,crack-7z-hash,1307,819,2126,64.506897,False,0.0,gpt-5-nano,crack-7z-hash,64.506897,False,0.0,False,64.506897 +131e5124-bb20-4ad5-aa84-74e8a013b13f,deepseek-ai/DeepSeek-V3.1,together_ai,dna-assembly,11884,7663,19547,245.836465,False,0.0,deepseek-ai/DeepSeek-V3.1,dna-assembly,245.836465,False,0.0,False,245.836465 +c191e077-3d47-465c-84df-b42e5c0cfc1b,claude-opus-4-1-20250805,anthropic,form-filling,6344,4318,10662,258.675238,True,1.0,claude-opus-4-1-20250805,form-filling,258.675238,True,1.0,True,258.675238 +fd093889-93f5-47c5-95d3-d0847d43aad2,deepseek-ai/DeepSeek-V3.1,together_ai,filter-js-from-html,3034,2385,5419,465.015467,False,0.0,deepseek-ai/DeepSeek-V3.1,filter-js-from-html,465.015467,False,0.0,False,465.015467 
+c3712e0c-b40a-44b2-8f96-38127fc70fca,gpt-5-nano,openai,build-pmars,15042,7667,22709,914.867195,False,0.0,gpt-5-nano,build-pmars,914.867195,False,0.0,False,914.867195 +bb27bd2e-4406-481f-8aa2-506ea6a4bf36,gpt-5-mini,openai,configure-git-webserver,1674,1900,3574,460.030772,False,0.0,gpt-5-mini,configure-git-webserver,460.030772,False,0.6,False,460.030772 +44091860-050c-4600-b44f-33e55237725a,zai-org/GLM-4.5-Air-FP8,together_ai,mteb-leaderboard,18836,14185,33021,495.409632,False,0.0,zai-org/GLM-4.5-Air-FP8,mteb-leaderboard,495.409632,False,0.0,False,495.409632 +2da9257d-d798-45cc-934b-cec9f4474f82,deepseek-ai/DeepSeek-V3.1,together_ai,build-initramfs-qemu,7133,6000,13133,902.509799,False,0.0,deepseek-ai/DeepSeek-V3.1,build-initramfs-qemu,902.509799,False,0.0,False,902.509799 +9f80c14f-16be-40a1-a6b3-8b56d668238a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,make-mips-interpreter,28475,21118,49593,1111.243218,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,make-mips-interpreter,1111.243218,False,0.0,False,1111.243218 +55386ba2-3251-4485-8ccf-3be1c12d3f94,deepseek-ai/DeepSeek-V3.1,together_ai,pytorch-model-recovery,9359,6388,15747,285.598543,True,1.0,deepseek-ai/DeepSeek-V3.1,pytorch-model-recovery,285.598543,True,0.6,True,285.598543 +35a419d4-b010-4931-b994-586c5b879f71,deepseek-ai/DeepSeek-V3.1,together_ai,pytorch-model-cli,11466,11697,23163,782.216051,False,0.0,deepseek-ai/DeepSeek-V3.1,pytorch-model-cli,782.216051,False,0.0,False,782.216051 +c7bd6d87-71aa-4122-b265-9dfb78ebfcda,OpenAI/gpt-oss-20B,together_ai,vulnerable-secret,4332,18101,22433,900.319148,False,0.0,OpenAI/gpt-oss-20B,vulnerable-secret,900.319148,False,0.0,False,900.319148 +b56252ee-d633-4bd0-9bea-ea320aa08563,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,filter-js-from-html,6172,6293,12465,465.860672,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,filter-js-from-html,465.860672,False,0.0,False,465.860672 
+73334acf-c2d6-4d74-9cd5-1df50690103d,grok-code-fast-1,xai,largest-eigenval,7554,3351,10905,908.582583,False,0.0,grok-code-fast-1,largest-eigenval,908.582583,False,0.0,False,908.582583 +2622034c-f0f0-43a7-b181-c0029ace9380,deepseek-ai/DeepSeek-V3.1,together_ai,openssl-selfsigned-cert,4161,3816,7977,552.602063,True,1.0,deepseek-ai/DeepSeek-V3.1,openssl-selfsigned-cert,552.602063,True,1.0,True,552.602063 +7c09e20f-6bf7-482b-89a5-23a9d356d053,moonshotai/Kimi-K2-Instruct-0905,together_ai,winning-avg-corewars,11280,11124,22404,1136.614409,False,0.0,moonshotai/Kimi-K2-Instruct-0905,winning-avg-corewars,1136.614409,False,0.0,False,1136.614409 +55f435f7-9ef3-47f7-b0a7-eabab131c186,gpt-5-nano,openai,financial-document-processor,20268,12144,32412,761.460402,False,0.0,gpt-5-nano,financial-document-processor,761.460402,False,0.0,False,761.460402 +6ccc8c1a-2433-4123-ae3e-7d6bb58f5d19,OpenAI/gpt-oss-20B,together_ai,build-pov-ray,2733,6547,9280,788.412803,False,0.0,OpenAI/gpt-oss-20B,build-pov-ray,788.412803,False,0.0,False,788.412803 +003b211c-0f55-453c-ba5a-1d22b4d3bd96,gpt-5-mini,openai,reverse-engineering,32482,19110,51592,1800.564711,False,0.0,gpt-5-mini,reverse-engineering,1800.564711,False,0.0,False,1800.564711 +e38e2f6a-fa9c-46ee-8e52-aac36a14d442,gpt-5-mini,openai,install-windows-3.11,4670,2548,7218,348.12997,False,0.0,gpt-5-mini,install-windows-3.11,348.12997,False,0.0,False,348.12997 +4e117788-96a1-4cb6-b13f-6f4f89d29c5d,claude-opus-4-1-20250805,anthropic,pypi-server,6004,3051,9055,290.260019,True,1.0,claude-opus-4-1-20250805,pypi-server,290.260019,True,1.0,True,290.260019 +dc4a31c6-85a4-44cc-83ed-69c1cb29de6e,grok-code-fast-1,xai,large-scale-text-editing,2883,2177,5060,208.982002,False,0.0,grok-code-fast-1,large-scale-text-editing,208.982002,False,0.0,False,208.982002 +0d25dc58-aca6-4096-a523-7d8af94be74e,claude-opus-4-1-20250805,anthropic,tune-mjcf,6027,5038,11065,900.001224,False,0.0,claude-opus-4-1-20250805,tune-mjcf,900.001224,False,0.25,False,900.001224 
+dae63725-cd6a-488a-a0b7-0442580f9738,claude-opus-4-1-20250805,anthropic,cancel-async-tasks,2629,2319,4948,76.752674,False,0.0,claude-opus-4-1-20250805,cancel-async-tasks,76.752674,False,0.125,False,76.752674 +a1c06619-d5b9-456a-907f-3584559f0909,grok-4-0709,xai,circuit-fibsqrt,3973,1179,5152,3627.213903,False,0.0,grok-4-0709,circuit-fibsqrt,3627.213903,False,0.0,False,3627.213903 +967cf96f-8ea3-4075-86f3-3fbf3594e5c7,moonshotai/Kimi-K2-Instruct-0905,together_ai,schemelike-metacircular-eval,28801,24837,53638,2410.727038,False,0.0,moonshotai/Kimi-K2-Instruct-0905,schemelike-metacircular-eval,2410.727038,False,0.0,False,2410.727038 +45d38a12-2f53-4e66-899d-f533b5abcc7b,gpt-5-nano,openai,polyglot-c-py,3030,4703,7733,254.236836,False,0.0,gpt-5-nano,polyglot-c-py,254.236836,False,0.0,False,254.236836 +29f7ddba-4e76-4cac-9614-5e79e5eba6dc,deepseek-ai/DeepSeek-V3.1,together_ai,qemu-startup,2034,1516,3550,81.613233,False,0.0,deepseek-ai/DeepSeek-V3.1,qemu-startup,81.613233,False,0.2,False,81.613233 +c19d4e24-023a-4add-b057-7000c90bb0a6,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,prove-plus-comm,2066,1781,3847,171.709209,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,prove-plus-comm,171.709209,True,0.2,True,171.709209 +21af24ea-410b-4846-98cc-d6e5258f1c09,gpt-5,openai,port-compressor,22565,34549,57114,3605.937222,False,0.0,gpt-5,port-compressor,3605.937222,False,0.0,False,3605.937222 +d1f205aa-ab0a-4f98-b5bd-b01f51f6129b,gpt-5-mini,openai,configure-git-webserver,4484,1587,6071,270.607702,False,0.0,gpt-5-mini,configure-git-webserver,270.607702,False,0.6,False,270.607702 +8d3d070d-8515-4ad5-b7f0-936792fc7074,claude-opus-4-1-20250805,anthropic,dna-assembly,23808,12229,36037,720.510238,False,0.0,claude-opus-4-1-20250805,dna-assembly,720.510238,False,0.0,False,720.510238 
+af3ae81f-df7c-4270-9ecf-a0aa24a03b75,claude-opus-4-1-20250805,anthropic,code-from-image,28322,25708,54030,1210.201027,False,0.0,claude-opus-4-1-20250805,code-from-image,1210.201027,False,0.125,False,1210.201027 +4f0c8ed6-bccf-4714-a72d-0783b6d98c07,zai-org/GLM-4.5-Air-FP8,together_ai,log-summary-date-ranges,6401,1660,8061,248.297571,False,0.0,zai-org/GLM-4.5-Air-FP8,log-summary-date-ranges,248.297571,False,0.8,False,248.297571 +955dd949-ce74-4963-b2bc-68d40ea37c0e,OpenAI/gpt-oss-20B,together_ai,path-tracing,624,1170,1794,136.590739,False,0.0,OpenAI/gpt-oss-20B,path-tracing,136.590739,False,0.0,False,136.590739 +1eb8980a-30fb-430c-9943-c8c0dd682126,openai/gpt-oss-120b,together_ai,model-extraction-relu-logits,1560,782,2342,330.267988,False,0.0,openai/gpt-oss-120b,model-extraction-relu-logits,330.267988,False,0.0,False,330.267988 +76e1a9b1-2efb-4747-89e7-ff252702bcf9,gemini-2.5-flash,gemini,openssl-selfsigned-cert,1998,1306,3304,71.064142,False,0.0,gemini-2.5-flash,openssl-selfsigned-cert,71.064142,False,0.0,False,71.064142 +e6ca1f78-1b81-496f-8043-b1114189bb1d,gpt-5-mini,openai,install-klee-minimal,4321,2202,6523,900.615276,False,0.0,gpt-5-mini,install-klee-minimal,900.615276,False,0.0,False,900.615276 +ed0414d2-8d05-4cd4-8499-6d9bd4dc9b94,moonshotai/Kimi-K2-Instruct-0905,together_ai,log-summary-date-ranges,9070,3603,12673,337.784765,True,1.0,moonshotai/Kimi-K2-Instruct-0905,log-summary-date-ranges,337.784765,True,0.8,True,337.784765 +9d56ce29-ed76-4b8d-930f-13bc9f52d980,gpt-5-nano,openai,install-windows-3.11,12403,18982,31385,3690.493455,False,0.0,gpt-5-nano,install-windows-3.11,3690.493455,False,0.0,False,3690.493455 +e528c6d2-364a-4733-9e8b-45df229c6e62,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,regex-log,5778,6522,12300,595.950667,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,regex-log,595.950667,False,0.2,False,595.950667 
+2aadb4a7-acb4-4c8e-8744-ba5f6f68196c,openai/gpt-oss-120b,together_ai,extract-elf,6218,6978,13196,231.194484,False,0.0,openai/gpt-oss-120b,extract-elf,231.194484,False,0.4,False,231.194484 +3554d0d3-49c2-4c35-b1e8-b114edcccde7,gemini-2.5-flash,gemini,pypi-server,9156,2728,11884,460.690822,False,0.0,gemini-2.5-flash,pypi-server,460.690822,False,0.0,False,460.690822 +6b44baac-48e9-4290-819a-c9a58bb81d1a,zai-org/GLM-4.5-Air-FP8,together_ai,build-initramfs-qemu,8029,4577,12606,447.428323,False,0.0,zai-org/GLM-4.5-Air-FP8,build-initramfs-qemu,447.428323,False,0.0,False,447.428323 +eef73477-a988-43f9-8501-ab54dbab36b0,grok-4-0709,xai,winning-avg-corewars,12632,14875,27507,3616.264834,False,0.0,grok-4-0709,winning-avg-corewars,3616.264834,False,0.0,False,3616.264834 +22e75e91-a347-4cbd-ac29-4f080beca403,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,dna-insert,15661,6499,22160,378.54079,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,dna-insert,378.54079,False,0.0,False,378.54079 +abb5fa06-95cd-4911-b085-7ab0e2d7520c,gemini-2.5-pro,gemini,distribution-search,8677,10668,19345,748.86701,True,1.0,gemini-2.5-pro,distribution-search,748.86701,True,0.6,True,748.86701 +a15d21ff-d07f-45c6-a446-c82bb92fb37b,gemini-2.5-flash,gemini,build-pov-ray,9208,8848,18056,1283.197018,False,0.0,gemini-2.5-flash,build-pov-ray,1283.197018,False,0.0,False,1283.197018 +b1c4728f-641a-406d-a1b6-1f5dabc607c8,claude-sonnet-4-20250514,anthropic,write-compressor,8782,8375,17157,904.585595,False,0.0,claude-sonnet-4-20250514,write-compressor,904.585595,False,0.0,False,904.585595 +a1875ad8-1a4e-4f8a-8050-686003be6920,OpenAI/gpt-oss-20B,together_ai,fix-code-vulnerability,3604,18246,21850,904.798113,False,0.0,OpenAI/gpt-oss-20B,fix-code-vulnerability,904.798113,False,0.0,False,904.798113 
+68c94c50-4321-4aee-991b-80bad70c0e66,moonshotai/Kimi-K2-Instruct-0905,together_ai,distribution-search,6182,5955,12137,582.754334,True,1.0,moonshotai/Kimi-K2-Instruct-0905,distribution-search,582.754334,True,0.2,True,582.754334 +d4162ea2-8493-4e15-a5f6-bc1dd14ec251,grok-4-0709,xai,git-leak-recovery,1259,645,1904,290.075708,False,0.0,grok-4-0709,git-leak-recovery,290.075708,False,0.4,False,290.075708 +1b8d5412-2245-4426-8e18-b282f7f51905,gemini-2.5-flash,gemini,mteb-retrieve,2266,2226,4492,397.667136,False,0.0,gemini-2.5-flash,mteb-retrieve,397.667136,False,0.0,False,397.667136 +d45e9d1a-a50f-49a1-9c67-c9bcfc90a003,zai-org/GLM-4.5-Air-FP8,together_ai,sanitize-git-repo,10524,3572,14096,379.461879,False,0.0,zai-org/GLM-4.5-Air-FP8,sanitize-git-repo,379.461879,False,0.0,False,379.461879 +16042bc7-3c75-495d-b562-021f08b2a053,claude-opus-4-1-20250805,anthropic,feal-differential-cryptanalysis,22216,22132,44348,1807.272191,False,0.0,claude-opus-4-1-20250805,feal-differential-cryptanalysis,1807.272191,False,0.0,False,1807.272191 +f6267b9b-acac-4681-bc23-6ff71e6b2205,gemini-2.5-pro,gemini,build-cython-ext,17979,6113,24092,907.970203,False,0.0,gemini-2.5-pro,build-cython-ext,907.970203,False,0.0,False,907.970203 +ed80baff-a9c9-4ae3-8c34-ca917dddbf67,gpt-5-mini,openai,install-klee-minimal,2124,2312,4436,900.000808,False,0.0,gpt-5-mini,install-klee-minimal,900.000808,False,0.0,False,900.000808 +260cd378-8b62-4c46-9701-2d6db990c7f0,grok-code-fast-1,xai,cobol-modernization,4650,2183,6833,141.010751,True,1.0,grok-code-fast-1,cobol-modernization,141.010751,True,0.6,True,141.010751 +45a7bbf1-8574-4af4-b6fd-87a10037f3ec,grok-4-0709,xai,gpt2-codegolf,1054,492,1546,342.080994,False,0.0,grok-4-0709,gpt2-codegolf,342.080994,False,0.0,False,342.080994 +baa9e22c-fdca-4106-8713-fd1d9f18055d,gemini-2.5-flash,gemini,pytorch-model-cli,4269,1609,5878,137.913301,False,0.0,gemini-2.5-flash,pytorch-model-cli,137.913301,False,0.0,False,137.913301 
+a68fb259-b4ef-4aca-ae0c-4907817dd7d3,gpt-5,openai,git-leak-recovery,2551,1766,4317,293.401903,True,1.0,gpt-5,git-leak-recovery,293.401903,True,0.7142857142857143,True,293.401903 +dd953812-6179-4c1c-9d14-ed0d9f17605e,gpt-5-mini,openai,reshard-c4-data,2432,3878,6310,200.233277,False,0.0,gpt-5-mini,reshard-c4-data,200.233277,False,0.0,False,200.233277 +fc3994c7-1b37-4348-a627-386c2c3e9cf1,gpt-5-nano,openai,regex-log,7778,9610,17388,900.00096,False,0.0,gpt-5-nano,regex-log,900.00096,False,0.2,False,900.00096 +e4aa94c8-ec8b-4fbd-ab1e-66ad614990e1,claude-opus-4-1-20250805,anthropic,bn-fit-modify,11671,4993,16664,492.502431,True,1.0,claude-opus-4-1-20250805,bn-fit-modify,492.502431,True,0.875,True,492.502431 +6ae836ef-016c-4891-9b0e-f83f7f89513a,claude-opus-4-1-20250805,anthropic,openssl-selfsigned-cert,5118,3968,9086,356.479367,True,1.0,claude-opus-4-1-20250805,openssl-selfsigned-cert,356.479367,True,1.0,True,356.479367 +6eea71e2-c8c0-4eef-96ba-53e6ae258e4c,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-pmars,14543,3761,18304,904.621618,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-pmars,904.621618,True,1.0,True,904.621618 +060e3775-b180-4a6d-85c2-055f115ddffd,claude-opus-4-1-20250805,anthropic,password-recovery,10117,7764,17881,638.741134,False,0.0,claude-opus-4-1-20250805,password-recovery,638.741134,False,0.5555555555555556,False,638.741134 +4d195acf-28e9-434f-abbc-be91853b8e4a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,path-tracing,4057,4485,8542,357.47181,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,path-tracing,357.47181,False,0.0,False,357.47181 +599ac243-d17f-4296-93a6-dd29dd392cf5,grok-4-0709,xai,pypi-server,6792,1762,8554,907.239492,True,1.0,grok-4-0709,pypi-server,907.239492,True,0.4,True,907.239492 +f03b45d5-6407-41be-a73b-a770d3f42327,OpenAI/gpt-oss-20B,together_ai,pytorch-model-recovery,2165,7706,9871,905.398722,False,0.0,OpenAI/gpt-oss-20B,pytorch-model-recovery,905.398722,False,0.0,False,905.398722 
+94bcdadf-25b2-4e47-8082-25ed7da15410,claude-sonnet-4-20250514,anthropic,break-filter-js-from-html,15443,13016,28459,1200.644363,False,0.0,claude-sonnet-4-20250514,break-filter-js-from-html,1200.644363,False,0.0,False,1200.644363 +40105664-d7d9-4161-aa81-fbe8ecc3d460,claude-sonnet-4-20250514,anthropic,qemu-startup,1553,1411,2964,915.963414,True,1.0,claude-sonnet-4-20250514,qemu-startup,915.963414,True,0.4,True,915.963414 +dedfc082-a80d-4c5c-89af-924c1e36c9f3,gpt-5-nano,openai,regex-log,6573,6541,13114,905.945441,False,0.0,gpt-5-nano,regex-log,905.945441,False,0.2,False,905.945441 +3b0cee7f-69dd-461c-8b31-5703dda6931c,gemini-2.5-flash,gemini,constraints-scheduling,5277,4857,10134,386.337337,False,0.0,gemini-2.5-flash,constraints-scheduling,386.337337,False,0.4,False,386.337337 +1178f2ce-aa25-4ec5-a591-edcc4f737bdc,claude-opus-4-1-20250805,anthropic,port-compressor,70558,45394,115952,3921.859939,False,0.0,claude-opus-4-1-20250805,port-compressor,3921.859939,False,0.0,False,3921.859939 +fe3a0b41-9395-42e0-8625-6b2ea3dffa72,claude-opus-4-1-20250805,anthropic,openssl-selfsigned-cert,2819,2474,5293,96.531413,True,1.0,claude-opus-4-1-20250805,openssl-selfsigned-cert,96.531413,True,1.0,True,96.531413 +062ca169-0225-4aef-9012-6eeeac6c0327,grok-code-fast-1,xai,polyglot-rust-c,1103,572,1675,134.266409,False,0.0,grok-code-fast-1,polyglot-rust-c,134.266409,False,0.0,False,134.266409 +5cd64d2d-72fe-4d1f-88c7-2b8aa81ef600,gemini-2.5-flash,gemini,sqlite-with-gcov,1575,1235,2810,310.82023,False,0.0,gemini-2.5-flash,sqlite-with-gcov,310.82023,False,0.2,False,310.82023 +9200626e-5e9f-4f21-b9cb-ea295228b32d,grok-4-0709,xai,log-summary-date-ranges,2225,2622,4847,328.253905,False,0.0,grok-4-0709,log-summary-date-ranges,328.253905,False,0.0,False,328.253905 
+65c38f1b-d693-453f-8006-8aeae9639884,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,make-mips-interpreter,30759,20369,51128,1800.226092,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,make-mips-interpreter,1800.226092,False,0.0,False,1800.226092 +af3b68f1-396c-448a-9dda-8d24dd3648d7,gemini-2.5-flash,gemini,tune-mjcf,6395,6921,13316,338.635574,True,1.0,gemini-2.5-flash,tune-mjcf,338.635574,True,0.6,True,338.635574 +a450bbf0-4497-49ad-a62e-1677a75a99b8,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,cobol-modernization,18807,15163,33970,918.382574,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,cobol-modernization,918.382574,False,0.4,False,918.382574 +582dab3e-c249-4c08-9d3c-bfbf064a057c,grok-code-fast-1,xai,mteb-leaderboard,921,334,1255,146.267777,False,0.0,grok-code-fast-1,mteb-leaderboard,146.267777,False,0.0,False,146.267777 +49a77aef-0dce-4d98-83c8-9784f2699048,moonshotai/Kimi-K2-Instruct-0905,together_ai,install-klee-minimal,16994,2846,19840,906.862312,False,0.0,moonshotai/Kimi-K2-Instruct-0905,install-klee-minimal,906.862312,False,0.0,False,906.862312 +5f8f119c-e667-4b12-84ca-2c15188bddd0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,break-filter-js-from-html,2642,2643,5285,337.005894,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,break-filter-js-from-html,337.005894,False,0.0,False,337.005894 +a968c80e-1797-4174-bfd4-ce0f986e1747,moonshotai/Kimi-K2-Instruct-0905,together_ai,code-from-image,6742,2823,9565,124.129238,True,1.0,moonshotai/Kimi-K2-Instruct-0905,code-from-image,124.129238,True,0.6,True,124.129238 +e53aec63-bc73-4458-b831-2633666456bb,gemini-2.5-flash,gemini,sqlite-with-gcov,1388,1212,2600,83.353124,False,0.0,gemini-2.5-flash,sqlite-with-gcov,83.353124,False,0.2,False,83.353124 +10d323a3-9f96-4154-84df-6e09898863ea,claude-opus-4-1-20250805,anthropic,cancel-async-tasks,4958,3067,8025,270.692221,False,0.0,claude-opus-4-1-20250805,cancel-async-tasks,270.692221,False,0.125,False,270.692221 
+c0c7c72e-0298-4ec4-ad93-39631f1befb0,openai/gpt-oss-120b,together_ai,mteb-leaderboard,1177,1021,2198,101.789268,False,0.0,openai/gpt-oss-120b,mteb-leaderboard,101.789268,False,0.0,False,101.789268 +71797a23-2aa0-4128-b87e-65488427ac58,gpt-5,openai,constraints-scheduling,4653,3617,8270,268.954183,True,1.0,gpt-5,constraints-scheduling,268.954183,True,0.8571428571428571,True,268.954183 +f9f8216f-5f56-4763-a81a-c484b33fe3dd,grok-4-0709,xai,filter-js-from-html,1620,2177,3797,737.144572,False,0.0,grok-4-0709,filter-js-from-html,737.144572,False,0.0,False,737.144572 +b0d2d742-b0f4-442e-911b-6f133cb25a14,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-pmars,5290,1215,6505,2011.660821,False,0.0,moonshotai/Kimi-K2-Instruct-0905,build-pmars,2011.660821,False,0.8,False,2011.660821 +9ac272c7-b675-438c-9fb0-0fb33578266b,claude-opus-4-1-20250805,anthropic,password-recovery,6867,5556,12423,907.853543,False,0.0,claude-opus-4-1-20250805,password-recovery,907.853543,False,0.5555555555555556,False,907.853543 +7a11441a-7a42-44d6-97b0-6b5bf8945f57,gpt-5,openai,financial-document-processor,9378,6381,15759,465.008393,False,0.0,gpt-5,financial-document-processor,465.008393,False,0.0,False,465.008393 +7ce97d43-01cf-4953-b4c4-1b74a5c0bc71,gpt-5-mini,openai,winning-avg-corewars,9050,6178,15228,3889.13686,False,0.0,gpt-5-mini,winning-avg-corewars,3889.13686,False,0.0,False,3889.13686 +47c4d818-7cca-4860-bc47-03c7f590d6b5,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,merge-diff-arc-agi-task,11036,5126,16162,912.495621,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,merge-diff-arc-agi-task,912.495621,False,0.4,False,912.495621 +a081fdee-435a-4ded-860c-52600dee3e96,grok-code-fast-1,xai,password-recovery,6323,2635,8958,725.064546,False,0.0,grok-code-fast-1,password-recovery,725.064546,False,0.0,False,725.064546 
+e15e2e63-0492-4377-b33c-a935e1cbb7ab,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,pytorch-model-cli,4460,1959,6419,196.332793,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,pytorch-model-cli,196.332793,False,0.0,False,196.332793 +881f9246-490c-428a-92f6-8099e0aab85c,deepseek-ai/DeepSeek-V3.1,together_ai,build-cython-ext,13609,3490,17099,900.421584,False,0.0,deepseek-ai/DeepSeek-V3.1,build-cython-ext,900.421584,False,0.0,False,900.421584 +626b6e8a-404a-4037-8682-ac85fa08d911,deepseek-ai/DeepSeek-V3.1,together_ai,pypi-server,3659,2219,5878,923.342997,False,0.0,deepseek-ai/DeepSeek-V3.1,pypi-server,923.342997,False,0.4,False,923.342997 +0e457e46-8c98-4bb5-b194-afdf0341ec38,gpt-5-nano,openai,install-windows-3.11,12994,29473,42467,3603.047322,False,0.0,gpt-5-nano,install-windows-3.11,3603.047322,False,0.0,False,3603.047322 +10209b2d-f3cd-4972-a053-f2fbcf36b593,zai-org/GLM-4.5-Air-FP8,together_ai,gpt2-codegolf,2801,3347,6148,168.904017,False,0.0,zai-org/GLM-4.5-Air-FP8,gpt2-codegolf,168.904017,False,0.0,False,168.904017 +75d55ff2-8385-41a2-9b13-8a4bd3202062,claude-sonnet-4-20250514,anthropic,gpt2-codegolf,12115,10747,22862,652.226257,False,0.0,claude-sonnet-4-20250514,gpt2-codegolf,652.226257,False,0.0,False,652.226257 +b709b08b-42aa-4bbe-b473-a201174d501b,openai/gpt-oss-120b,together_ai,build-initramfs-qemu,1365,976,2341,187.639593,False,0.0,openai/gpt-oss-120b,build-initramfs-qemu,187.639593,False,0.0,False,187.639593 +fd2b6ce1-0aa5-4571-b797-2598558a0832,claude-opus-4-1-20250805,anthropic,sanitize-git-repo,8260,2184,10444,1318.237121,False,0.0,claude-opus-4-1-20250805,sanitize-git-repo,1318.237121,False,0.0,False,1318.237121 +648aceaf-ba05-44b2-bc7a-e02573892ee4,OpenAI/gpt-oss-20B,together_ai,distribution-search,191,968,1159,101.232021,False,0.0,OpenAI/gpt-oss-20B,distribution-search,101.232021,False,0.0,False,101.232021 
+efabd1eb-d108-4305-b8c1-ff9c54aca96c,gpt-5-nano,openai,torch-tensor-parallelism,2406,2420,4826,174.734081,False,0.0,gpt-5-nano,torch-tensor-parallelism,174.734081,False,0.0,False,174.734081 +74c6cc0c-f59c-436b-adbb-4c1781960e95,gpt-5-mini,openai,fix-ocaml-gc,35485,31544,67029,3602.311654,False,0.0,gpt-5-mini,fix-ocaml-gc,3602.311654,False,0.0,False,3602.311654 +9d16e901-6dc8-43ba-9b8c-a897c998ce5b,openai/gpt-oss-120b,together_ai,path-tracing,3289,2355,5644,160.948016,False,0.0,openai/gpt-oss-120b,path-tracing,160.948016,False,0.0,False,160.948016 +d8a56aba-4c25-4f56-af23-d1e7180d9ff1,openai/gpt-oss-120b,together_ai,log-summary-date-ranges,1849,949,2798,24.000834,False,0.0,openai/gpt-oss-120b,log-summary-date-ranges,24.000834,False,0.0,False,24.000834 +ec706b11-1e87-48ba-93aa-72ab7fb00467,grok-code-fast-1,xai,largest-eigenval,7261,5071,12332,900.198927,False,0.0,grok-code-fast-1,largest-eigenval,900.198927,False,0.0,False,900.198927 +841cb7ef-442e-440b-971d-2ceb424ef6fa,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sanitize-git-repo,11114,3526,14640,338.235869,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sanitize-git-repo,338.235869,False,0.0,False,338.235869 +4503f9c5-63a6-4e2a-b04e-6250752b491f,openai/gpt-oss-120b,together_ai,mteb-retrieve,1811,747,2558,123.541305,False,0.0,openai/gpt-oss-120b,mteb-retrieve,123.541305,False,0.0,False,123.541305 +3efbef34-1841-4433-be94-a61b3662bc3a,claude-sonnet-4-20250514,anthropic,crack-7z-hash,10338,4326,14664,488.225367,True,1.0,claude-sonnet-4-20250514,crack-7z-hash,488.225367,True,1.0,True,488.225367 +da7071eb-7ea6-4e09-84e8-f6172fdd7a44,gpt-5-nano,openai,train-fasttext,17252,11546,28798,3606.066432,False,0.0,gpt-5-nano,train-fasttext,3606.066432,False,0.0,False,3606.066432 +958caf74-cf6f-4618-99d3-e62e7fe3c368,gpt-5-mini,openai,pypi-server,3368,1494,4862,159.632302,False,0.0,gpt-5-mini,pypi-server,159.632302,False,0.8,False,159.632302 
+98225b59-8672-4294-acde-adecde6f1714,gpt-5-mini,openai,install-windows-3.11,4493,2378,6871,1116.303841,False,0.0,gpt-5-mini,install-windows-3.11,1116.303841,False,0.0,False,1116.303841 +ba168e96-63f1-4d45-8f31-f41704d52b2b,gpt-5-nano,openai,train-fasttext,24326,28913,53239,3603.687584,False,0.0,gpt-5-nano,train-fasttext,3603.687584,False,0.0,False,3603.687584 +d71d756f-35c9-4f9f-99a4-f17d2dc0ccd6,claude-sonnet-4-20250514,anthropic,dna-assembly,12027,7966,19993,720.023391,False,0.0,claude-sonnet-4-20250514,dna-assembly,720.023391,False,0.0,False,720.023391 +fc085ff4-1ecf-4dd6-bdc6-a537e278afda,claude-sonnet-4-20250514,anthropic,cancel-async-tasks,2093,1453,3546,160.756635,True,1.0,claude-sonnet-4-20250514,cancel-async-tasks,160.756635,True,0.8,True,160.756635 +aa0a7438-d92e-4c60-b9ce-8cb13d7cfa0d,openai/gpt-oss-120b,together_ai,cobol-modernization,4628,3614,8242,880.826442,True,1.0,openai/gpt-oss-120b,cobol-modernization,880.826442,True,0.8,True,880.826442 +9723b5f3-2249-4834-8d7e-4e4e6afe7cc3,openai/gpt-oss-120b,together_ai,path-tracing,4143,7075,11218,990.240518,False,0.0,openai/gpt-oss-120b,path-tracing,990.240518,False,0.0,False,990.240518 +cb02b4ad-c656-434a-a32f-fca3e475be87,grok-code-fast-1,xai,make-mips-interpreter,16992,10490,27482,783.100446,False,0.0,grok-code-fast-1,make-mips-interpreter,783.100446,False,0.0,False,783.100446 +0da3030f-abda-4a61-a575-ff94f85b833a,gemini-2.5-flash,gemini,wasm-pipeline,8057,3986,12043,883.290468,False,0.0,gemini-2.5-flash,wasm-pipeline,883.290468,False,0.4,False,883.290468 +d4cb8f39-4bdd-4041-b050-b84e1a24326a,gpt-5-nano,openai,reshard-c4-data,6234,5415,11649,341.528637,False,0.0,gpt-5-nano,reshard-c4-data,341.528637,False,0.0,False,341.528637 +1c7e74ed-9c6a-48f6-b3f6-6ee6c40af43f,deepseek-ai/DeepSeek-V3.1,together_ai,path-tracing-reverse,42276,10269,52545,926.290808,False,0.0,deepseek-ai/DeepSeek-V3.1,path-tracing-reverse,926.290808,False,0.2,False,926.290808 
+62525c68-1e86-4fdb-ba64-af72b9852e38,gpt-5-nano,openai,qemu-startup,6835,8501,15336,903.429558,False,0.0,gpt-5-nano,qemu-startup,903.429558,False,0.0,False,903.429558 +a4493ced-0ed1-4aa5-8299-5e3459fc8484,claude-opus-4-1-20250805,anthropic,path-tracing-reverse,39551,31467,71018,1800.000917,False,0.0,claude-opus-4-1-20250805,path-tracing-reverse,1800.000917,False,0.0,False,1800.000917 +a28c0ba5-3b17-4d8c-841d-5e2894c05fe0,gemini-2.5-pro,gemini,circuit-fibsqrt,57463,69238,126701,3607.193816,False,0.0,gemini-2.5-pro,circuit-fibsqrt,3607.193816,False,0.0,False,3607.193816 +5ac1cc5d-2751-4eae-a5d9-96a4da87c5c4,moonshotai/Kimi-K2-Instruct-0905,together_ai,dna-insert,10950,4120,15070,417.386783,False,0.0,moonshotai/Kimi-K2-Instruct-0905,dna-insert,417.386783,False,0.0,False,417.386783 +6955d6e1-c4ad-47c0-81c7-dbe45c22c211,openai/gpt-oss-120b,together_ai,make-mips-interpreter,16205,11287,27492,1815.799916,False,0.0,openai/gpt-oss-120b,make-mips-interpreter,1815.799916,False,0.0,False,1815.799916 +9946fe4b-1f16-4b2a-869c-67978b1ce6e7,deepseek-ai/DeepSeek-V3.1,together_ai,break-filter-js-from-html,7914,10746,18660,1222.818287,False,0.0,deepseek-ai/DeepSeek-V3.1,break-filter-js-from-html,1222.818287,False,0.0,False,1222.818287 +c5869034-8b6b-4712-8cdb-41fe3f395368,zai-org/GLM-4.5-Air-FP8,together_ai,fix-ocaml-gc,55868,27713,83581,1609.463975,False,0.0,zai-org/GLM-4.5-Air-FP8,fix-ocaml-gc,1609.463975,False,0.0,False,1609.463975 +55dadd19-ba2b-4f0a-94cb-ba498bcf2bfa,OpenAI/gpt-oss-20B,together_ai,dna-insert,1197,3125,4322,422.784881,False,0.0,OpenAI/gpt-oss-20B,dna-insert,422.784881,False,0.0,False,422.784881 +68bd8595-ef59-451f-938f-e0f035b8144a,openai/gpt-oss-120b,together_ai,merge-diff-arc-agi-task,10704,10592,21296,912.786288,False,0.0,openai/gpt-oss-120b,merge-diff-arc-agi-task,912.786288,False,0.0,False,912.786288 
+747cd308-e681-451a-91ff-fdf0271a8366,openai/gpt-oss-120b,together_ai,largest-eigenval,7349,7672,15021,900.036554,False,0.0,openai/gpt-oss-120b,largest-eigenval,900.036554,False,0.0,False,900.036554 +e55a994f-114e-4324-8723-89dbf1dd0762,openai/gpt-oss-120b,together_ai,code-from-image,21392,13871,35263,1220.886275,False,0.0,openai/gpt-oss-120b,code-from-image,1220.886275,False,0.0,False,1220.886275 +b3255bde-5951-4e8d-bdb9-6f49db75e659,claude-sonnet-4-20250514,anthropic,pytorch-model-cli,10577,6504,17081,519.731355,False,0.0,claude-sonnet-4-20250514,pytorch-model-cli,519.731355,False,0.4,False,519.731355 +c31cfdd1-602e-4a34-b8e8-822820d3e96e,gemini-2.5-flash,gemini,financial-document-processor,4704,3293,7997,129.254561,False,0.0,gemini-2.5-flash,financial-document-processor,129.254561,False,0.0,False,129.254561 +f1755a39-6fc2-48d5-83db-ee773c79f222,gpt-5,openai,install-klee-minimal,1732,1910,3642,900.000697,False,0.0,gpt-5,install-klee-minimal,900.000697,False,0.0,False,900.000697 +53f8669f-7fe2-4244-af21-4aafe08a6e0a,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,model-extraction-relu-logits,8640,7194,15834,816.844789,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,model-extraction-relu-logits,816.844789,False,0.0,False,816.844789 +1ebdd63c-1eaa-495d-9f3a-1db36cea5b62,gpt-5,openai,password-recovery,8991,8590,17581,907.806038,False,0.0,gpt-5,password-recovery,907.806038,False,0.0,False,907.806038 +675d9cff-07e9-4229-8683-ac5672b88e93,grok-4-0709,xai,model-extraction-relu-logits,2845,2837,5682,900.479796,False,0.0,grok-4-0709,model-extraction-relu-logits,900.479796,False,0.0,False,900.479796 +b5caf698-964c-484d-a268-a635553496c1,zai-org/GLM-4.5-Air-FP8,together_ai,build-pov-ray,16890,7872,24762,857.452523,False,0.0,zai-org/GLM-4.5-Air-FP8,build-pov-ray,857.452523,False,0.0,False,857.452523 
+2526fb6a-159a-4109-9b29-394ab7adbed5,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,feal-linear-cryptanalysis,6408,2965,9373,647.888643,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,feal-linear-cryptanalysis,647.888643,False,0.0,False,647.888643 +25d527b3-f5fa-42b7-bb01-73df19023097,gemini-2.5-pro,gemini,torch-tensor-parallelism,1880,1149,3029,91.635433,False,0.0,gemini-2.5-pro,torch-tensor-parallelism,91.635433,False,0.0,False,91.635433 +70f41658-a133-40d4-bfdc-b98565172e7a,grok-4-0709,xai,path-tracing-reverse,3433,3997,7430,1802.345362,False,0.0,grok-4-0709,path-tracing-reverse,1802.345362,False,0.0,False,1802.345362 +7952c808-a1db-4615-abcc-af01073c3d7d,gpt-5-mini,openai,schemelike-metacircular-eval,25386,25123,50509,2400.032071,False,0.0,gpt-5-mini,schemelike-metacircular-eval,2400.032071,False,0.0,False,2400.032071 +58cc3941-88a0-455e-9ffe-4a0e05525d85,grok-4-0709,xai,run-pdp11-code,5792,1958,7750,1002.790046,False,0.0,grok-4-0709,run-pdp11-code,1002.790046,False,0.0,False,1002.790046 +899c39df-0934-409f-bef2-82c3a3f6cf5d,gpt-5,openai,make-mips-interpreter,26574,35512,62086,1800.00051,False,0.0,gpt-5,make-mips-interpreter,1800.00051,False,0.0,False,1800.00051 +7b56cb74-5bd8-4174-a21c-46d1db75dc75,OpenAI/gpt-oss-20B,together_ai,install-windows-3.11,1028,3527,4555,243.355714,False,0.0,OpenAI/gpt-oss-20B,install-windows-3.11,243.355714,False,0.0,False,243.355714 +c833fd31-f4be-4e47-9252-d13aa3acca2b,gpt-5,openai,circuit-fibsqrt,24334,25502,49836,2806.007752,True,1.0,gpt-5,circuit-fibsqrt,2806.007752,True,0.6666666666666666,True,2806.007752 +c3ed9aa9-f28c-4821-a5f0-60a121704ce1,gpt-5,openai,large-scale-text-editing,3058,2247,5305,370.535239,True,1.0,gpt-5,large-scale-text-editing,370.535239,True,0.4285714285714285,True,370.535239 
+e19c5765-2c2d-4888-81bb-a1847ec6161a,claude-sonnet-4-20250514,anthropic,log-summary-date-ranges,11416,7211,18627,905.872455,True,1.0,claude-sonnet-4-20250514,log-summary-date-ranges,905.872455,True,1.0,True,905.872455 +71b785c4-06af-44f2-9150-00a8a6e10302,gemini-2.5-pro,gemini,break-filter-js-from-html,2034,1542,3576,182.090463,False,0.0,gemini-2.5-pro,break-filter-js-from-html,182.090463,False,0.2,False,182.090463 +f5fc4ce5-180d-4f1d-b0c2-07a7f72bc30f,OpenAI/gpt-oss-20B,together_ai,constraints-scheduling,231,397,628,74.12003,False,0.0,OpenAI/gpt-oss-20B,constraints-scheduling,74.12003,False,0.2,False,74.12003 +bfb7ed66-7436-4b27-bd32-e7b979be28c0,OpenAI/gpt-oss-20B,together_ai,break-filter-js-from-html,1161,2933,4094,65.606627,False,0.0,OpenAI/gpt-oss-20B,break-filter-js-from-html,65.606627,False,0.0,False,65.606627 +209a3ce1-a607-4779-8105-5a2a8f03f55d,gemini-2.5-flash,gemini,install-windows-3.11,1956,1075,3031,113.706274,False,0.0,gemini-2.5-flash,install-windows-3.11,113.706274,False,0.0,False,113.706274 +1441e536-a7ae-4ecc-8615-151b96d24b7f,grok-code-fast-1,xai,video-processing,2169,1592,3761,182.58662,False,0.0,grok-code-fast-1,video-processing,182.58662,False,0.0,False,182.58662 +e144c3ee-6855-4f5b-ba63-d5d340cecfdc,gpt-5-nano,openai,port-compressor,14581,19777,34358,3611.691835,False,0.0,gpt-5-nano,port-compressor,3611.691835,False,0.0,False,3611.691835 +161a3789-cf56-4335-9996-f0bb26832b7a,moonshotai/Kimi-K2-Instruct-0905,together_ai,install-klee-minimal,14979,2866,17845,904.157665,False,0.0,moonshotai/Kimi-K2-Instruct-0905,install-klee-minimal,904.157665,False,0.0,False,904.157665 +9c234dc1-abf2-4cbc-9014-3c82cbb2c0b2,zai-org/GLM-4.5-Air-FP8,together_ai,prove-plus-comm,4674,6618,11292,517.126616,True,1.0,zai-org/GLM-4.5-Air-FP8,prove-plus-comm,517.126616,True,0.8,True,517.126616 
+12db81e6-9e97-4a1e-94b4-c2a458b48a84,claude-sonnet-4-20250514,anthropic,schemelike-metacircular-eval,28608,26671,55279,2400.626329,False,0.0,claude-sonnet-4-20250514,schemelike-metacircular-eval,2400.626329,False,0.0,False,2400.626329 +4a773c2d-70aa-42cb-a1d4-e39de686e077,claude-opus-4-1-20250805,anthropic,hf-model-inference,3707,2878,6585,578.428453,False,0.0,claude-opus-4-1-20250805,hf-model-inference,578.428453,False,0.25,False,578.428453 +b49e398c-2fc2-473e-8937-2b3876543994,claude-opus-4-1-20250805,anthropic,circuit-fibsqrt,56606,62563,119169,3605.205582,False,0.0,claude-opus-4-1-20250805,circuit-fibsqrt,3605.205582,False,0.0,False,3605.205582 +ab827028-5277-457f-a17e-f2346fe6297d,claude-opus-4-1-20250805,anthropic,hf-model-inference,4291,3270,7561,412.360843,False,0.0,claude-opus-4-1-20250805,hf-model-inference,412.360843,False,0.25,False,412.360843 +e4bcdc8f-fc92-4aa9-b6fc-23f4e4f6c565,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,path-tracing-reverse,19308,15371,34679,1840.649835,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,path-tracing-reverse,1840.649835,False,0.0,False,1840.649835 +49e9a6df-bb66-4748-802c-90236c2b0431,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,qemu-alpine-ssh,1596,1333,2929,181.289747,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,qemu-alpine-ssh,181.289747,False,0.0,False,181.289747 +61d5f61b-b128-4458-a7ec-7feb734a3ecb,gpt-5-nano,openai,filter-js-from-html,9151,13137,22288,901.618909,False,0.0,gpt-5-nano,filter-js-from-html,901.618909,False,0.0,False,901.618909 +c1f9e8d1-c0c4-4ed5-ab5a-98dea645467c,openai/gpt-oss-120b,together_ai,reverse-engineering,8372,18209,26581,1800.043933,False,0.0,openai/gpt-oss-120b,reverse-engineering,1800.043933,False,0.2,False,1800.043933 
+b64c92c0-0961-4d3a-b574-b86bb1274980,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,filter-js-from-html,1819,1330,3149,118.673897,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,filter-js-from-html,118.673897,False,0.0,False,118.673897 +0f0849a5-65df-49c6-b2e3-7fd6c61f8d54,claude-opus-4-1-20250805,anthropic,make-mips-interpreter,31548,30290,61838,1800.001671,False,0.0,claude-opus-4-1-20250805,make-mips-interpreter,1800.001671,False,0.0,False,1800.001671 +679104e1-676c-4505-8748-5e96da2b5f67,OpenAI/gpt-oss-20B,together_ai,dna-assembly,735,1956,2691,227.617005,False,0.0,OpenAI/gpt-oss-20B,dna-assembly,227.617005,False,0.0,False,227.617005 +a3cf9822-dbcd-4023-b781-dc16820f448a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,pypi-server,3670,1313,4983,558.133171,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,pypi-server,558.133171,False,0.2,False,558.133171 +65d04922-ca6d-482c-a6eb-9763f0936706,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,fix-git,14208,4768,18976,900.035437,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,fix-git,900.035437,False,0.0,False,900.035437 +677b8b59-0e58-41d6-8504-0f75cb8be454,grok-code-fast-1,xai,code-from-image,6296,2820,9116,297.290677,False,0.0,grok-code-fast-1,code-from-image,297.290677,False,0.0,False,297.290677 +32b4a7a5-40d5-4c67-9798-40d5dd4ff4e3,gpt-5,openai,sparql-university,5514,1975,7489,341.788481,False,0.0,gpt-5,sparql-university,341.788481,False,0.8,False,341.788481 +a4aa8ddd-bc91-416c-8bec-f8c8e4c71655,openai/gpt-oss-120b,together_ai,fix-code-vulnerability,8060,6902,14962,900.181918,False,0.0,openai/gpt-oss-120b,fix-code-vulnerability,900.181918,False,0.0,False,900.181918 +bf8b3f74-df47-4f3e-bcf5-1e83ab1abda5,gpt-5,openai,financial-document-processor,7597,8114,15711,1259.580442,False,0.0,gpt-5,financial-document-processor,1259.580442,False,0.0,False,1259.580442 
+62f43f2d-b0ba-4951-a283-26a4aa00e494,claude-sonnet-4-20250514,anthropic,fix-git,3826,2643,6469,480.673688,True,1.0,claude-sonnet-4-20250514,fix-git,480.673688,True,1.0,True,480.673688 +b6387e81-c754-4704-a30c-e7013a23b8f3,deepseek-ai/DeepSeek-V3.1,together_ai,nginx-request-logging,4564,1913,6477,420.484928,False,0.0,deepseek-ai/DeepSeek-V3.1,nginx-request-logging,420.484928,False,0.4,False,420.484928 +29d35c51-fe74-4323-afe2-47f6905decc5,claude-opus-4-1-20250805,anthropic,path-tracing-reverse,55978,43344,99322,1800.001767,False,0.0,claude-opus-4-1-20250805,path-tracing-reverse,1800.001767,False,0.0,False,1800.001767 +101f0de8-a65c-40d2-bfef-5c194785c5bb,claude-opus-4-1-20250805,anthropic,feal-differential-cryptanalysis,26970,27378,54348,1800.001205,False,0.0,claude-opus-4-1-20250805,feal-differential-cryptanalysis,1800.001205,False,0.0,False,1800.001205 +bf307024-8734-4d0e-8c24-4acf679c85f4,claude-opus-4-1-20250805,anthropic,install-windows-3.11,7892,2484,10376,177.77918,False,0.0,claude-opus-4-1-20250805,install-windows-3.11,177.77918,False,0.0,False,177.77918 +c5b97de4-2ba6-4e4e-869e-706eca38cb75,deepseek-ai/DeepSeek-V3.1,together_ai,distribution-search,14086,11104,25190,701.194769,False,0.0,deepseek-ai/DeepSeek-V3.1,distribution-search,701.194769,False,0.0,False,701.194769 +9e8a65a4-341a-4191-b20e-b19282e522c3,OpenAI/gpt-oss-20B,together_ai,filter-js-from-html,1270,658,1928,362.813859,False,0.0,OpenAI/gpt-oss-20B,filter-js-from-html,362.813859,False,0.0,False,362.813859 +2be26b05-3333-478c-afe2-b2acdc76c0b1,zai-org/GLM-4.5-Air-FP8,together_ai,adaptive-rejection-sampler,18823,18385,37208,903.037236,False,0.0,zai-org/GLM-4.5-Air-FP8,adaptive-rejection-sampler,903.037236,False,0.0,False,903.037236 +b09962d1-db36-4b8d-94a9-ac2032b0f516,gemini-2.5-pro,gemini,dna-assembly,6974,4061,11035,451.541357,False,0.0,gemini-2.5-pro,dna-assembly,451.541357,False,0.0,False,451.541357 
+d6c8edd1-e031-41ed-b4bf-7b808e8ad427,moonshotai/Kimi-K2-Instruct-0905,together_ai,write-compressor,7415,7050,14465,939.934948,False,0.0,moonshotai/Kimi-K2-Instruct-0905,write-compressor,939.934948,False,0.0,False,939.934948 +4e4777b1-039c-4424-b2ac-9ce9766f3318,gpt-5-nano,openai,mteb-leaderboard,33665,53668,87333,3602.432102,False,0.0,gpt-5-nano,mteb-leaderboard,3602.432102,False,0.0,False,3602.432102 +428e829a-0c30-48ec-ad8d-a31fd4be7d49,claude-opus-4-1-20250805,anthropic,count-dataset-tokens,6942,3186,10128,170.811476,False,0.0,claude-opus-4-1-20250805,count-dataset-tokens,170.811476,False,0.0,False,170.811476 +5b0aa2fc-0690-4264-a5cc-c6765b323c32,gpt-5-mini,openai,winning-avg-corewars,13640,12243,25883,3624.57897,False,0.0,gpt-5-mini,winning-avg-corewars,3624.57897,False,0.0,False,3624.57897 +22df531f-bf24-4f6d-bc7b-b010873ab465,gemini-2.5-flash,gemini,build-initramfs-qemu,5714,10157,15871,902.21007,False,0.0,gemini-2.5-flash,build-initramfs-qemu,902.21007,False,0.0,False,902.21007 +bbcf0ba5-3373-4084-9473-1af7971155d4,gemini-2.5-flash,gemini,code-from-image,6017,2394,8411,175.876213,True,1.0,gemini-2.5-flash,code-from-image,175.876213,True,0.4,True,175.876213 +acb1d3a5-023a-45da-90a6-3f0d90adf5cf,moonshotai/Kimi-K2-Instruct-0905,together_ai,polyglot-c-py,12849,12360,25209,901.780684,False,0.0,moonshotai/Kimi-K2-Instruct-0905,polyglot-c-py,901.780684,False,0.0,False,901.780684 +d68797a9-d08b-4030-b2ee-2ff60b01fe06,gpt-5-nano,openai,financial-document-processor,22417,15297,37714,1200.602162,False,0.0,gpt-5-nano,financial-document-processor,1200.602162,False,0.0,False,1200.602162 +81b85d40-cdde-40be-93cb-d604afde25f9,gpt-5-nano,openai,circuit-fibsqrt,4100,4528,8628,294.273455,False,0.0,gpt-5-nano,circuit-fibsqrt,294.273455,False,0.0,False,294.273455 +02a750d9-a393-4f5d-a578-29d0f56611df,gemini-2.5-flash,gemini,build-pov-ray,99115,79373,178488,5622.761483,False,0.0,gemini-2.5-flash,build-pov-ray,5622.761483,False,0.0,False,5622.761483 
+aadfbb61-677b-40af-a7d3-5147a44aecf7,claude-opus-4-1-20250805,anthropic,filter-js-from-html,11405,9198,20603,244.716243,False,0.0,claude-opus-4-1-20250805,filter-js-from-html,244.716243,False,0.0,False,244.716243 +897b72b3-14fc-4e17-98cd-dc940b49d36f,gpt-5-mini,openai,gpt2-codegolf,2061,2372,4433,436.186051,False,0.0,gpt-5-mini,gpt2-codegolf,436.186051,False,0.0,False,436.186051 +fa2775ea-3e28-4a68-ba8b-6e0ef3ac5d87,gpt-5,openai,fix-git,4935,1942,6877,435.026853,True,1.0,gpt-5,fix-git,435.026853,True,1.0,True,435.026853 +58c69ea6-265a-459c-a770-dca1ef81a615,claude-sonnet-4-20250514,anthropic,bn-fit-modify,18997,8728,27725,820.136814,True,1.0,claude-sonnet-4-20250514,bn-fit-modify,820.136814,True,0.8,True,820.136814 +a6547ec3-3f6d-4bcc-b07c-9355a18c0c33,claude-opus-4-1-20250805,anthropic,financial-document-processor,10674,3906,14580,409.223505,False,0.0,claude-opus-4-1-20250805,financial-document-processor,409.223505,False,0.0,False,409.223505 +6c3e5b9f-0193-4fea-9098-c4f01174cc73,openai/gpt-oss-120b,together_ai,fix-code-vulnerability,13149,8376,21525,511.118547,False,0.0,openai/gpt-oss-120b,fix-code-vulnerability,511.118547,False,0.0,False,511.118547 +94371db0-b28b-4a7a-83b1-cfb47a74370b,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,break-filter-js-from-html,3420,3557,6977,270.436057,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,break-filter-js-from-html,270.436057,False,0.0,False,270.436057 +14d3f843-9db3-4ee6-a8e6-68a12e6153fa,deepseek-ai/DeepSeek-V3.1,together_ai,build-pov-ray,20767,6801,27568,1001.618871,False,0.0,deepseek-ai/DeepSeek-V3.1,build-pov-ray,1001.618871,False,0.4,False,1001.618871 +1fa20ee9-325e-46c4-b090-22368e10c9b2,claude-opus-4-1-20250805,anthropic,bn-fit-modify,15015,7176,22191,556.406186,False,0.0,claude-opus-4-1-20250805,bn-fit-modify,556.406186,False,0.875,False,556.406186 
+14e4c0e1-444e-49ef-8c94-0fca269d1437,gpt-5,openai,distribution-search,5185,4625,9810,608.0784,True,1.0,gpt-5,distribution-search,608.0784,True,1.0,True,608.0784 +ddf1e92e-9eba-4f78-ae68-f1884650d3e2,openai/gpt-oss-120b,together_ai,dna-assembly,10653,2894,13547,187.498913,False,0.0,openai/gpt-oss-120b,dna-assembly,187.498913,False,0.0,False,187.498913 +574c6244-981c-4f31-8029-f42e33a8f24c,gpt-5,openai,mteb-retrieve,2102,1041,3143,276.970491,False,0.0,gpt-5,mteb-retrieve,276.970491,False,0.0,False,276.970491 +a3204fe4-ff67-4c04-b964-451940607141,gpt-5-nano,openai,configure-git-webserver,5902,2657,8559,900.73465,False,0.0,gpt-5-nano,configure-git-webserver,900.73465,False,0.2,False,900.73465 +4494df2c-3164-4d38-82e4-efe499bf9d84,moonshotai/Kimi-K2-Instruct-0905,together_ai,form-filling,7062,5142,12204,397.287931,False,0.0,moonshotai/Kimi-K2-Instruct-0905,form-filling,397.287931,False,0.8,False,397.287931 +f242a9ae-cc73-4911-8070-8cf8c815d9eb,gpt-5,openai,sanitize-git-repo,4761,5506,10267,1323.975506,False,0.0,gpt-5,sanitize-git-repo,1323.975506,False,0.2857142857142857,False,1323.975506 +e90fcddf-fe64-4f44-b12e-d9e9cfd3f3ff,gpt-5-nano,openai,make-doom-for-mips,11419,7808,19227,901.505165,False,0.0,gpt-5-nano,make-doom-for-mips,901.505165,False,0.0,False,901.505165 +25626d83-ea6e-455d-ae88-70deb2dccd90,claude-sonnet-4-20250514,anthropic,filter-js-from-html,8990,7857,16847,515.436418,False,0.0,claude-sonnet-4-20250514,filter-js-from-html,515.436418,False,0.0,False,515.436418 +193e3363-8b25-4836-b7c3-863aa886a4f2,grok-code-fast-1,xai,cobol-modernization,3715,1882,5597,105.695752,True,1.0,grok-code-fast-1,cobol-modernization,105.695752,True,0.6,True,105.695752 +1da3c988-7d59-4bd8-a49a-6b9381d56684,gpt-5-mini,openai,polyglot-rust-c,7138,5688,12826,906.995784,False,0.0,gpt-5-mini,polyglot-rust-c,906.995784,False,0.0,False,906.995784 
+f97dc390-b7ba-4935-bf82-f79e02d159dd,grok-4-0709,xai,vulnerable-secret,6637,3559,10196,841.34485,True,1.0,grok-4-0709,vulnerable-secret,841.34485,True,0.6,True,841.34485 +dd29edfb-f115-42ca-b42d-655ebf73d59d,deepseek-ai/DeepSeek-V3.1,together_ai,pypi-server,7527,3943,11470,438.034544,False,0.0,deepseek-ai/DeepSeek-V3.1,pypi-server,438.034544,False,0.4,False,438.034544 +1e4f776b-7524-44f2-b9e0-a5be702eeb72,zai-org/GLM-4.5-Air-FP8,together_ai,install-windows-3.11,6396,3585,9981,352.388501,False,0.0,zai-org/GLM-4.5-Air-FP8,install-windows-3.11,352.388501,False,0.0,False,352.388501 +5b597738-727e-4aa6-9030-1cfb8f8b2ac2,gemini-2.5-pro,gemini,form-filling,6081,4820,10901,223.876052,True,1.0,gemini-2.5-pro,form-filling,223.876052,True,0.2,True,223.876052 +51ea6191-fce2-412a-97c5-eeaefe0c14aa,moonshotai/Kimi-K2-Instruct-0905,together_ai,reshard-c4-data,7975,5697,13672,518.070317,False,0.0,moonshotai/Kimi-K2-Instruct-0905,reshard-c4-data,518.070317,False,0.0,False,518.070317 +4fbefe11-44f5-42ce-b8ca-7b64d20697f1,deepseek-ai/DeepSeek-V3.1,together_ai,build-pmars,12318,2695,15013,364.590255,True,1.0,deepseek-ai/DeepSeek-V3.1,build-pmars,364.590255,True,1.0,True,364.590255 +8d2939e5-cb1f-4ee9-a00d-1e5dd56d39f1,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,install-windows-3.11,7489,2882,10371,1203.25457,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,install-windows-3.11,1203.25457,False,0.0,False,1203.25457 +4781e186-090c-4f11-9287-aa75f1b12340,gpt-5-mini,openai,train-fasttext,18158,19333,37491,3606.12247,False,0.0,gpt-5-mini,train-fasttext,3606.12247,False,0.0,False,3606.12247 +8a533501-ab8e-4a53-a5f1-e7fe1b65f2f6,zai-org/GLM-4.5-Air-FP8,together_ai,financial-document-processor,9612,4239,13851,1202.196976,False,0.0,zai-org/GLM-4.5-Air-FP8,financial-document-processor,1202.196976,False,0.0,False,1202.196976 
+cf605add-f801-44c7-824b-2e7de38ba337,openai/gpt-oss-120b,together_ai,circuit-fibsqrt,10902,13390,24292,1155.87658,False,0.0,openai/gpt-oss-120b,circuit-fibsqrt,1155.87658,False,0.0,False,1155.87658 +53b91d78-bd4c-402c-a2d6-498aafbf5b5d,openai/gpt-oss-120b,together_ai,wasm-pipeline,1530,852,2382,34.906796,False,0.0,openai/gpt-oss-120b,wasm-pipeline,34.906796,False,0.0,False,34.906796 +7dd3ba78-b646-4866-9d33-eb328d23c223,grok-code-fast-1,xai,path-tracing,3543,2545,6088,353.434563,False,0.0,grok-code-fast-1,path-tracing,353.434563,False,0.0,False,353.434563 +96ccc7b3-5ebd-4602-85f6-930b024e1a7b,gemini-2.5-pro,gemini,extract-elf,9672,5994,15666,900.276668,False,0.0,gemini-2.5-pro,extract-elf,900.276668,False,0.0,False,900.276668 +d8f3a31b-8117-448b-b3a2-76d6af2bdcd7,openai/gpt-oss-120b,together_ai,large-scale-text-editing,5681,10594,16275,1212.308338,False,0.0,openai/gpt-oss-120b,large-scale-text-editing,1212.308338,False,0.0,False,1212.308338 +c16559a9-59ee-481d-b510-788461242ac5,gpt-5-nano,openai,gpt2-codegolf,4566,7636,12202,900.018413,False,0.0,gpt-5-nano,gpt2-codegolf,900.018413,False,0.0,False,900.018413 +41a0673e-5b36-478a-8531-e20d17c277e3,gpt-5-nano,openai,dna-assembly,10546,11378,21924,777.270451,False,0.0,gpt-5-nano,dna-assembly,777.270451,False,0.0,False,777.270451 +ec1afa10-40ef-4ae0-a918-f4dc7680160e,gemini-2.5-pro,gemini,extract-elf,12265,3731,15996,825.739477,False,0.0,gemini-2.5-pro,extract-elf,825.739477,False,0.0,False,825.739477 +1dcdb912-1680-451e-a8e1-0eb3a19eb1a3,openai/gpt-oss-120b,together_ai,circuit-fibsqrt,8229,30199,38428,3624.499176,False,0.0,openai/gpt-oss-120b,circuit-fibsqrt,3624.499176,False,0.0,False,3624.499176 +692df3a5-85b6-40f2-be8c-52c4deb85f96,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,make-doom-for-mips,17726,3901,21627,793.212135,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,make-doom-for-mips,793.212135,False,0.0,False,793.212135 
+ee79d8b8-2b25-44e9-954a-aedb7a87a556,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,filter-js-from-html,3299,3304,6603,562.278109,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,filter-js-from-html,562.278109,False,0.0,False,562.278109 +2a260166-61f0-4fce-b463-4ff9e962dfc6,gpt-5,openai,form-filling,11309,12743,24052,568.057126,True,1.0,gpt-5,form-filling,568.057126,True,0.8,True,568.057126 +f159c79d-2470-48aa-8a61-edcd0f7b70c4,claude-opus-4-1-20250805,anthropic,configure-git-webserver,5968,1726,7694,83.241783,False,0.0,claude-opus-4-1-20250805,configure-git-webserver,83.241783,False,0.625,False,83.241783 +d7f9cdc8-9a63-489b-9a66-ff574eba5cb2,grok-code-fast-1,xai,reshard-c4-data,3501,2979,6480,1012.044011,False,0.0,grok-code-fast-1,reshard-c4-data,1012.044011,False,0.0,False,1012.044011 +2a24d1d9-fb85-4f44-a37a-12d2a790692b,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-cython-ext,18355,3880,22235,323.427828,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-cython-ext,323.427828,False,0.0,False,323.427828 +732b8070-0731-495f-9fce-82a99731db16,moonshotai/Kimi-K2-Instruct-0905,together_ai,path-tracing,17251,15461,32712,1181.13938,False,0.0,moonshotai/Kimi-K2-Instruct-0905,path-tracing,1181.13938,False,0.0,False,1181.13938 +8853c917-ff48-4149-aca0-95a2a327bd4b,grok-code-fast-1,xai,configure-git-webserver,4532,927,5459,266.269946,False,0.0,grok-code-fast-1,configure-git-webserver,266.269946,False,0.0,False,266.269946 +13462627-1abe-46f7-b809-0fe5957216fb,gemini-2.5-flash,gemini,qemu-alpine-ssh,2008,2008,4016,193.816308,False,0.0,gemini-2.5-flash,qemu-alpine-ssh,193.816308,False,0.0,False,193.816308 +49bebc3d-28e1-48d2-8d08-f023fb44d323,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,polyglot-rust-c,3177,2496,5673,301.09723,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,polyglot-rust-c,301.09723,False,0.0,False,301.09723 
+042787c0-52d6-4d41-9140-bb0dac2b803e,claude-sonnet-4-20250514,anthropic,pytorch-model-recovery,13916,7635,21551,574.999406,True,1.0,claude-sonnet-4-20250514,pytorch-model-recovery,574.999406,True,1.0,True,574.999406 +b26ca7ce-077f-40ab-8184-f7941fe9004c,OpenAI/gpt-oss-20B,together_ai,make-doom-for-mips,2029,5676,7705,908.142126,False,0.0,OpenAI/gpt-oss-20B,make-doom-for-mips,908.142126,False,0.0,False,908.142126 +2aed27f3-8026-448e-94dd-e21e7fbd3957,gemini-2.5-pro,gemini,bn-fit-modify,29250,15409,44659,1886.47887,False,0.0,gemini-2.5-pro,bn-fit-modify,1886.47887,False,0.0,False,1886.47887 +3da3b6c0-a617-47e0-816d-6715ad7d210d,grok-4-0709,xai,distribution-search,1747,1359,3106,721.909356,False,0.0,grok-4-0709,distribution-search,721.909356,False,0.4,False,721.909356 +56279176-9b1b-41e9-acf8-d2b77ff99f16,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,qemu-startup,2169,1889,4058,228.085108,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,qemu-startup,228.085108,False,0.4,False,228.085108 +da970dac-9368-40b3-bbaa-e2dc89d5f103,claude-sonnet-4-20250514,anthropic,qemu-alpine-ssh,2752,3985,6737,646.304485,True,1.0,claude-sonnet-4-20250514,qemu-alpine-ssh,646.304485,True,0.6,True,646.304485 +fc1eccda-d40b-4ece-b7ea-dcd03d3bbeed,gpt-5,openai,write-compressor,4300,6968,11268,893.131821,False,0.0,gpt-5,write-compressor,893.131821,False,0.3333333333333333,False,893.131821 +61050336-bb24-4ee8-94de-ce9fe730b482,moonshotai/Kimi-K2-Instruct-0905,together_ai,log-summary-date-ranges,7511,2217,9728,410.260485,True,1.0,moonshotai/Kimi-K2-Instruct-0905,log-summary-date-ranges,410.260485,True,0.8,True,410.260485 +429fe3be-ca47-4df1-a119-4a63b19cb6d5,OpenAI/gpt-oss-20B,together_ai,port-compressor,3292,16783,20075,1137.426176,False,0.0,OpenAI/gpt-oss-20B,port-compressor,1137.426176,False,0.0,False,1137.426176 
+249dca27-0cc7-4d7a-b9b4-6aad31ae3139,grok-code-fast-1,xai,distribution-search,1225,450,1675,192.206809,False,0.0,grok-code-fast-1,distribution-search,192.206809,False,0.0,False,192.206809 +09f3ed25-7b78-415f-88d1-6a34fcd57659,claude-sonnet-4-20250514,anthropic,count-dataset-tokens,15780,4954,20734,870.010049,False,0.0,claude-sonnet-4-20250514,count-dataset-tokens,870.010049,False,0.0,False,870.010049 +7b38922e-e1ea-4ce6-b06f-18b800884fe5,gpt-5-nano,openai,winning-avg-corewars,31185,28836,60021,3618.29844,False,0.0,gpt-5-nano,winning-avg-corewars,3618.29844,False,0.0,False,3618.29844 +d5dba17f-42af-47c5-ba4b-2c84e3114d67,zai-org/GLM-4.5-Air-FP8,together_ai,make-doom-for-mips,17870,7069,24939,916.121096,False,0.0,zai-org/GLM-4.5-Air-FP8,make-doom-for-mips,916.121096,False,0.0,False,916.121096 +77a38917-d85a-4853-8fbd-c0af307184d5,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,feal-differential-cryptanalysis,2518,1662,4180,231.038091,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,feal-differential-cryptanalysis,231.038091,False,0.0,False,231.038091 +1adf4074-c319-4dd8-90cf-634436a52465,gpt-5-nano,openai,crack-7z-hash,6193,2312,8505,256.013581,False,0.0,gpt-5-nano,crack-7z-hash,256.013581,False,0.0,False,256.013581 +e704bb7d-9eba-4933-acd0-dfe4bea28464,gemini-2.5-pro,gemini,circuit-fibsqrt,19985,27250,47235,3600.717217,False,0.0,gemini-2.5-pro,circuit-fibsqrt,3600.717217,False,0.0,False,3600.717217 +e6fc1e44-e6f2-4a78-97b1-39d4d7c8f08f,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,train-fasttext,15356,8228,23584,3600.005803,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,train-fasttext,3600.005803,False,0.0,False,3600.005803 +57dfbc3a-5fe4-4138-ac2e-9e096cd2525e,grok-4-0709,xai,wasm-pipeline,8949,5003,13952,859.199082,True,1.0,grok-4-0709,wasm-pipeline,859.199082,True,0.4,True,859.199082 
+fd0833bc-42b9-43c0-ace8-4ab501c51855,OpenAI/gpt-oss-20B,together_ai,build-initramfs-qemu,1262,868,2130,29.739768,False,0.0,OpenAI/gpt-oss-20B,build-initramfs-qemu,29.739768,False,0.0,False,29.739768 +4c5a08ad-beed-4be3-ba32-f30d3f4a178e,grok-4-0709,xai,financial-document-processor,9198,3317,12515,566.509606,False,0.0,grok-4-0709,financial-document-processor,566.509606,False,0.0,False,566.509606 +50275210-8562-48a2-972c-2e6ae755371c,zai-org/GLM-4.5-Air-FP8,together_ai,qemu-alpine-ssh,3309,8867,12176,1046.068728,False,0.0,zai-org/GLM-4.5-Air-FP8,qemu-alpine-ssh,1046.068728,False,0.0,False,1046.068728 +35f8f37c-134f-4995-9f11-d440e6a8de25,gpt-5,openai,sqlite-with-gcov,5979,1686,7665,402.98383,False,0.0,gpt-5,sqlite-with-gcov,402.98383,False,0.3333333333333333,False,402.98383 +8312196b-b53b-48e3-a104-63dc0ce91ed3,deepseek-ai/DeepSeek-V3.1,together_ai,git-leak-recovery,3041,2575,5616,365.090115,True,1.0,deepseek-ai/DeepSeek-V3.1,git-leak-recovery,365.090115,True,0.6,True,365.090115 +3ee0e99c-ff76-460f-a80a-c7bc476c66cc,gemini-2.5-pro,gemini,qemu-startup,1162,775,1937,456.28347,True,1.0,gemini-2.5-pro,qemu-startup,456.28347,True,0.2,True,456.28347 +420d2f38-43a9-4e50-bf8b-06c33d314efc,gpt-5-mini,openai,sqlite-with-gcov,5115,1978,7093,608.153945,True,1.0,gpt-5-mini,sqlite-with-gcov,608.153945,True,1.0,True,608.153945 +f83541b9-5792-4a60-a39a-b34d5941031c,gpt-5,openai,make-doom-for-mips,13108,4631,17739,902.386841,False,0.0,gpt-5,make-doom-for-mips,902.386841,False,0.0,False,902.386841 +bf5def0b-35e3-43a1-abac-f8cbd1f16d5d,openai/gpt-oss-120b,together_ai,build-cython-ext,7302,3471,10773,912.055555,False,0.0,openai/gpt-oss-120b,build-cython-ext,912.055555,False,0.0,False,912.055555 +e06368eb-39b1-409d-a8e0-2eb9a72a6e02,gemini-2.5-pro,gemini,configure-git-webserver,5077,1087,6164,394.346769,False,0.0,gemini-2.5-pro,configure-git-webserver,394.346769,False,0.0,False,394.346769 
+87b6d493-025d-45c1-aabd-618b271a3160,zai-org/GLM-4.5-Air-FP8,together_ai,install-klee-minimal,3998,2368,6366,826.878221,False,0.0,zai-org/GLM-4.5-Air-FP8,install-klee-minimal,826.878221,False,0.0,False,826.878221 +e3dd65b1-cb80-4963-8c82-707803ca8ff8,zai-org/GLM-4.5-Air-FP8,together_ai,pytorch-model-cli,10729,13781,24510,1997.071165,False,0.0,zai-org/GLM-4.5-Air-FP8,pytorch-model-cli,1997.071165,False,0.0,False,1997.071165 +51779134-2afb-415c-aabb-bac628bd3e81,gemini-2.5-flash,gemini,make-doom-for-mips,18918,6018,24936,728.76104,False,0.0,gemini-2.5-flash,make-doom-for-mips,728.76104,False,0.0,False,728.76104 +fd546a0d-23fb-4821-b9cb-505c0ca04752,deepseek-ai/DeepSeek-V3.1,together_ai,pytorch-model-cli,5456,4643,10099,205.551128,False,0.0,deepseek-ai/DeepSeek-V3.1,pytorch-model-cli,205.551128,False,0.0,False,205.551128 +f8150528-fc88-4b6f-969c-3069167190be,claude-sonnet-4-20250514,anthropic,form-filling,6735,5668,12403,637.550871,True,1.0,claude-sonnet-4-20250514,form-filling,637.550871,True,1.0,True,637.550871 +6e12f3dc-1378-4e86-992d-8dfad8ef555b,grok-code-fast-1,xai,feal-linear-cryptanalysis,5405,2711,8116,307.19413,False,0.0,grok-code-fast-1,feal-linear-cryptanalysis,307.19413,False,0.0,False,307.19413 +6d6b8567-42ba-4d1f-bdfa-d24dce3f87b7,zai-org/GLM-4.5-Air-FP8,together_ai,gpt2-codegolf,31630,15470,47100,901.027477,False,0.0,zai-org/GLM-4.5-Air-FP8,gpt2-codegolf,901.027477,False,0.0,False,901.027477 +ad24cf0d-4b7a-4c92-b132-9e073ff1e419,gpt-5-mini,openai,install-klee-minimal,4111,2244,6355,834.16108,False,0.0,gpt-5-mini,install-klee-minimal,834.16108,False,0.0,False,834.16108 +151a4206-4449-4589-b83d-af018ea3764a,zai-org/GLM-4.5-Air-FP8,together_ai,polyglot-c-py,23479,31460,54939,900.075737,False,0.0,zai-org/GLM-4.5-Air-FP8,polyglot-c-py,900.075737,False,0.0,False,900.075737 
+4bfa8dfe-29ef-405a-802f-2c7b7e7f178a,deepseek-ai/DeepSeek-V3.1,together_ai,write-compressor,8486,8557,17043,915.705531,False,0.0,deepseek-ai/DeepSeek-V3.1,write-compressor,915.705531,False,0.0,False,915.705531 +e46396d6-e548-4394-ba05-cf6e21b2cd11,OpenAI/gpt-oss-20B,together_ai,reshard-c4-data,2121,3893,6014,114.110424,False,0.0,OpenAI/gpt-oss-20B,reshard-c4-data,114.110424,False,0.0,False,114.110424 +a6cb4836-4784-458c-97e4-cf7b1276c3e7,deepseek-ai/DeepSeek-V3.1,together_ai,feal-differential-cryptanalysis,7656,7001,14657,313.832335,False,0.0,deepseek-ai/DeepSeek-V3.1,feal-differential-cryptanalysis,313.832335,False,0.0,False,313.832335 +dac61496-2f32-4e62-9d21-57f4a92cbe78,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sqlite-with-gcov,3113,1067,4180,275.817919,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sqlite-with-gcov,275.817919,False,0.4,False,275.817919 +0d0ac6a1-3a52-47f9-a160-cef281679c0e,claude-opus-4-1-20250805,anthropic,filter-js-from-html,9831,7896,17727,297.129012,False,0.0,claude-opus-4-1-20250805,filter-js-from-html,297.129012,False,0.0,False,297.129012 +b008c349-bf1d-4b2d-8471-93a5ffc60331,deepseek-ai/DeepSeek-V3.1,together_ai,chess-best-move,3808,2559,6367,196.529202,False,0.0,deepseek-ai/DeepSeek-V3.1,chess-best-move,196.529202,False,0.0,False,196.529202 +be7142de-e7bd-4abe-adfd-bccb4cb63131,zai-org/GLM-4.5-Air-FP8,together_ai,form-filling,27983,28900,56883,934.238207,False,0.0,zai-org/GLM-4.5-Air-FP8,form-filling,934.238207,False,0.8,False,934.238207 +9b253c0b-3f1e-43ce-ae61-83b9ce41065d,gemini-2.5-pro,gemini,financial-document-processor,10241,5059,15300,546.588775,False,0.0,gemini-2.5-pro,financial-document-processor,546.588775,False,0.0,False,546.588775 +7a808293-9462-4801-a4c1-6f289c5ac9c2,moonshotai/Kimi-K2-Instruct-0905,together_ai,pytorch-model-cli,8618,4850,13468,650.269341,False,0.0,moonshotai/Kimi-K2-Instruct-0905,pytorch-model-cli,650.269341,False,0.0,False,650.269341 
+0ebc1507-08c2-4aa6-a7c6-a413218cf892,moonshotai/Kimi-K2-Instruct-0905,together_ai,video-processing,3927,3392,7319,499.261372,False,0.0,moonshotai/Kimi-K2-Instruct-0905,video-processing,499.261372,False,0.0,False,499.261372 +122dedad-0280-4369-84f9-8a805cf13c94,claude-sonnet-4-20250514,anthropic,constraints-scheduling,5874,3825,9699,818.115168,True,1.0,claude-sonnet-4-20250514,constraints-scheduling,818.115168,True,1.0,True,818.115168 +cae9f70b-5a9d-496a-9dc0-8cd8a818b62b,OpenAI/gpt-oss-20B,together_ai,prove-plus-comm,1217,3144,4361,81.375598,False,0.0,OpenAI/gpt-oss-20B,prove-plus-comm,81.375598,False,0.0,False,81.375598 +0f30e67a-d2c4-46eb-8611-c5db4f5d4245,openai/gpt-oss-120b,together_ai,dna-insert,19209,11256,30465,363.300554,False,0.0,openai/gpt-oss-120b,dna-insert,363.300554,False,0.0,False,363.300554 +d439f183-792a-47ed-8907-72fd2367095f,gpt-5,openai,break-filter-js-from-html,2964,1635,4599,421.532825,True,1.0,gpt-5,break-filter-js-from-html,421.532825,True,0.4285714285714285,True,421.532825 +c4655063-bd02-42e0-9495-a74111a73a7e,claude-sonnet-4-20250514,anthropic,break-filter-js-from-html,7535,7481,15016,1203.851562,False,0.0,claude-sonnet-4-20250514,break-filter-js-from-html,1203.851562,False,0.0,False,1203.851562 +eeb76996-1338-424c-9268-c8280da62777,gpt-5,openai,dna-assembly,8103,11732,19835,777.441933,False,0.0,gpt-5,dna-assembly,777.441933,False,0.0,False,777.441933 +7db68ba8-e14d-4f08-9bbb-5faa755228af,claude-sonnet-4-20250514,anthropic,mteb-retrieve,2540,2077,4617,281.241099,False,0.0,claude-sonnet-4-20250514,mteb-retrieve,281.241099,False,0.0,False,281.241099 +d1709980-2236-4d4b-9453-b01217df5aed,gemini-2.5-flash,gemini,build-cython-ext,10675,4198,14873,633.901747,False,0.0,gemini-2.5-flash,build-cython-ext,633.901747,False,0.0,False,633.901747 
+1b010f11-d81d-4372-a70a-c6da40acbc70,claude-sonnet-4-20250514,anthropic,log-summary-date-ranges,13191,4460,17651,323.940119,True,1.0,claude-sonnet-4-20250514,log-summary-date-ranges,323.940119,True,1.0,True,323.940119 +5bfbcca6-221a-437e-81d2-7d00604f661d,grok-code-fast-1,xai,fix-ocaml-gc,17803,5204,23007,2073.222343,False,0.0,grok-code-fast-1,fix-ocaml-gc,2073.222343,False,0.0,False,2073.222343 +d05ac18f-8183-4bf9-8da0-5f15f07c3997,claude-opus-4-1-20250805,anthropic,filter-js-from-html,9195,6924,16119,340.037855,False,0.0,claude-opus-4-1-20250805,filter-js-from-html,340.037855,False,0.0,False,340.037855 +5fca7c12-2229-4b02-9d4d-2cefcd9d93dc,claude-sonnet-4-20250514,anthropic,reverse-engineering,37299,27780,65079,1805.487131,False,0.0,claude-sonnet-4-20250514,reverse-engineering,1805.487131,False,0.0,False,1805.487131 +de4ab92a-a3cb-4ce9-9b6d-6320e1337e40,zai-org/GLM-4.5-Air-FP8,together_ai,financial-document-processor,10385,4311,14696,413.321093,False,0.0,zai-org/GLM-4.5-Air-FP8,financial-document-processor,413.321093,False,0.0,False,413.321093 +2adc619d-8a1d-4ea0-9101-5bfa8b40e1c4,grok-code-fast-1,xai,adaptive-rejection-sampler,4741,4112,8853,567.466922,False,0.0,grok-code-fast-1,adaptive-rejection-sampler,567.466922,False,0.0,False,567.466922 +2b0e296c-80b8-44e6-8b45-c8deb9d78897,grok-4-0709,xai,hf-model-inference,7600,1799,9399,438.960544,True,1.0,grok-4-0709,hf-model-inference,438.960544,True,1.0,True,438.960544 +7997bee2-7b52-44ff-b829-eb4530aa2361,claude-sonnet-4-20250514,anthropic,install-klee-minimal,11913,2039,13952,900.559529,False,0.0,claude-sonnet-4-20250514,install-klee-minimal,900.559529,False,0.0,False,900.559529 +6f84fb8d-5818-4974-968d-064bbd6990d0,claude-opus-4-1-20250805,anthropic,financial-document-processor,13336,7904,21240,748.892467,False,0.0,claude-opus-4-1-20250805,financial-document-processor,748.892467,False,0.0,False,748.892467 
+3db3e388-30cf-4a91-81d9-f335ceab06f5,grok-code-fast-1,xai,vulnerable-secret,2598,3508,6106,916.962339,False,0.0,grok-code-fast-1,vulnerable-secret,916.962339,False,0.6,False,916.962339 +85bf8056-de9d-492c-af2a-de8efa81b2ea,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,log-summary-date-ranges,9546,4163,13709,338.196541,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,log-summary-date-ranges,338.196541,True,0.8,True,338.196541 +25c1c06e-4b62-44cb-a243-aec64a207fe7,zai-org/GLM-4.5-Air-FP8,together_ai,mteb-retrieve,1548,1712,3260,154.485415,False,0.0,zai-org/GLM-4.5-Air-FP8,mteb-retrieve,154.485415,False,0.0,False,154.485415 +46a5d097-aa06-4f7a-83af-ffbff2c96450,gemini-2.5-flash,gemini,wasm-pipeline,2075,1761,3836,111.127443,False,0.0,gemini-2.5-flash,wasm-pipeline,111.127443,False,0.4,False,111.127443 +edb0b564-8acb-4163-9cf2-d6e1e808fb80,gemini-2.5-flash,gemini,reverse-engineering,23021,19460,42481,3721.991091,False,0.0,gemini-2.5-flash,reverse-engineering,3721.991091,False,0.0,False,3721.991091 +ace70c6f-52bd-451f-9fb9-c227108a7333,claude-sonnet-4-20250514,anthropic,pytorch-model-cli,14314,5925,20239,787.452802,True,1.0,claude-sonnet-4-20250514,pytorch-model-cli,787.452802,True,0.4,True,787.452802 +15870bad-0bd8-4d33-91f3-40e29dca24a7,claude-opus-4-1-20250805,anthropic,make-doom-for-mips,42387,15405,57792,926.68805,False,0.0,claude-opus-4-1-20250805,make-doom-for-mips,926.68805,False,0.0,False,926.68805 +bf0c9adf-fc31-477b-b11d-4a636e50cc38,gpt-5-nano,openai,reshard-c4-data,2965,3474,6439,488.023741,False,0.0,gpt-5-nano,reshard-c4-data,488.023741,False,0.0,False,488.023741 +3e69bdec-98d9-4b7c-9a5c-a88eef5d2fe1,zai-org/GLM-4.5-Air-FP8,together_ai,vulnerable-secret,5454,6647,12101,912.382655,False,0.0,zai-org/GLM-4.5-Air-FP8,vulnerable-secret,912.382655,False,0.0,False,912.382655 
+26170339-13cd-4381-b254-c1d8ba1b4175,claude-sonnet-4-20250514,anthropic,financial-document-processor,15010,4662,19672,597.356623,True,1.0,claude-sonnet-4-20250514,financial-document-processor,597.356623,True,0.2,True,597.356623 +be77ee40-b5f7-417c-92dc-e32ca9ca0154,gemini-2.5-flash,gemini,extract-elf,6448,5117,11565,541.481969,False,0.0,gemini-2.5-flash,extract-elf,541.481969,False,0.4,False,541.481969 +d5c42548-984b-4d57-bb93-ec1e0f3ec4dd,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,configure-git-webserver,6604,2812,9416,609.395277,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,configure-git-webserver,609.395277,True,0.6,True,609.395277 +db7c15c9-a7f1-4297-8b07-ab8c56a333eb,claude-opus-4-1-20250805,anthropic,pytorch-model-cli,8205,3933,12138,584.181164,False,0.0,claude-opus-4-1-20250805,pytorch-model-cli,584.181164,False,0.4285714285714285,False,584.181164 +6a93b939-3388-45eb-98d3-dc8e5e85a20f,gpt-5-nano,openai,winning-avg-corewars,35312,40476,75788,3618.360888,False,0.0,gpt-5-nano,winning-avg-corewars,3618.360888,False,0.0,False,3618.360888 +09378996-e8f7-4e81-9a54-2b257883276f,gemini-2.5-pro,gemini,distribution-search,10185,9166,19351,1231.011082,True,1.0,gemini-2.5-pro,distribution-search,1231.011082,True,0.6,True,1231.011082 +c8ea837c-b5ca-4bf7-9929-76d1dc27719d,claude-opus-4-1-20250805,anthropic,train-fasttext,15690,3737,19427,1977.492241,True,1.0,claude-opus-4-1-20250805,train-fasttext,1977.492241,True,0.2857142857142857,True,1977.492241 +a2d20d7e-15bc-4b35-9758-e997bd79f615,deepseek-ai/DeepSeek-V3.1,together_ai,run-pdp11-code,9026,4672,13698,1002.745341,False,0.0,deepseek-ai/DeepSeek-V3.1,run-pdp11-code,1002.745341,False,0.0,False,1002.745341 +e9c21109-98b5-4153-a6a0-5ba4b01ef7fa,gpt-5-mini,openai,cancel-async-tasks,1475,1052,2527,88.83292,False,0.0,gpt-5-mini,cancel-async-tasks,88.83292,False,0.4,False,88.83292 
+0a93f725-4c04-4520-b674-abfb4666cf96,zai-org/GLM-4.5-Air-FP8,together_ai,build-cython-ext,18306,8537,26843,923.791429,False,0.0,zai-org/GLM-4.5-Air-FP8,build-cython-ext,923.791429,False,0.0,False,923.791429 +8510a9ae-e849-4868-8491-7b69003589e4,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-pov-ray,31237,13379,44616,2985.378311,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-pov-ray,2985.378311,False,0.2,False,2985.378311 +f181d90a-b9cd-41b1-b880-709b215f5c14,deepseek-ai/DeepSeek-V3.1,together_ai,qemu-startup,1864,1395,3259,316.110884,True,1.0,deepseek-ai/DeepSeek-V3.1,qemu-startup,316.110884,True,0.2,True,316.110884 +44584cfe-51c7-4710-a675-0f444937a90e,gemini-2.5-pro,gemini,train-fasttext,31819,8446,40265,3607.245154,False,0.0,gemini-2.5-pro,train-fasttext,3607.245154,False,0.0,False,3607.245154 +a9186817-c1f5-46c5-b9a1-44269c5712c8,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,pytorch-model-cli,8198,3771,11969,1174.397936,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,pytorch-model-cli,1174.397936,False,0.0,False,1174.397936 +5e80d518-20df-4262-bf89-ef61cfa5af80,gemini-2.5-flash,gemini,pytorch-model-cli,16941,5284,22225,887.785892,False,0.0,gemini-2.5-flash,pytorch-model-cli,887.785892,False,0.0,False,887.785892 +9393fcd9-2ad1-416a-b62c-82009c277103,gpt-5-mini,openai,crack-7z-hash,1171,800,1971,68.630062,False,0.0,gpt-5-mini,crack-7z-hash,68.630062,False,0.0,False,68.630062 +f4a635bb-c4ef-4bef-a2a9-5bf0a4b993e3,claude-sonnet-4-20250514,anthropic,tune-mjcf,9794,8155,17949,900.090081,False,0.0,claude-sonnet-4-20250514,tune-mjcf,900.090081,False,0.2,False,900.090081 +3520488f-e4de-4191-9494-7d44164f44eb,claude-opus-4-1-20250805,anthropic,make-mips-interpreter,26447,24173,50620,1804.123265,False,0.0,claude-opus-4-1-20250805,make-mips-interpreter,1804.123265,False,0.0,False,1804.123265 
+3158c005-9fc2-4761-bf22-aaa84e59462b,claude-opus-4-1-20250805,anthropic,code-from-image,18206,19455,37661,1204.245047,False,0.0,claude-opus-4-1-20250805,code-from-image,1204.245047,False,0.125,False,1204.245047 +d58a0742-3aac-4205-8809-bbd6a2dd6e0c,gemini-2.5-flash,gemini,tune-mjcf,8245,11574,19819,579.517125,False,0.0,gemini-2.5-flash,tune-mjcf,579.517125,False,0.6,False,579.517125 +b633aacc-dcff-4f8e-a650-7d1d0f72092d,gpt-5,openai,train-fasttext,16745,7341,24086,3621.195862,False,0.0,gpt-5,train-fasttext,3621.195862,False,0.0,False,3621.195862 +0b00c9f8-4f8a-4583-bdde-4b1ad6d8e374,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sqlite-with-gcov,11213,3228,14441,573.841481,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sqlite-with-gcov,573.841481,True,0.6,True,573.841481 +2e51ad5d-5c3a-4d14-8926-48ae06a8c5b3,gpt-5-nano,openai,path-tracing,6390,1542,7932,233.00758,False,0.0,gpt-5-nano,path-tracing,233.00758,False,0.2,False,233.00758 +8bff6887-db91-45f7-993c-fe9a6b11124f,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,make-doom-for-mips,5988,1645,7633,186.107043,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,make-doom-for-mips,186.107043,False,0.0,False,186.107043 +db5b5d4b-0dda-450d-85f5-dc573787c304,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,write-compressor,1706,2372,4078,306.709834,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,write-compressor,306.709834,False,0.0,False,306.709834 +d8bb51cf-591b-4add-9c91-a00e08a3bd83,moonshotai/Kimi-K2-Instruct-0905,together_ai,make-doom-for-mips,16577,4327,20904,908.135969,False,0.0,moonshotai/Kimi-K2-Instruct-0905,make-doom-for-mips,908.135969,False,0.0,False,908.135969 +e6c8abcb-daf4-4127-871f-2215a4557d21,openai/gpt-oss-120b,together_ai,sqlite-db-truncate,1191,898,2089,160.282328,False,0.0,openai/gpt-oss-120b,sqlite-db-truncate,160.282328,False,0.0,False,160.282328 
+8c63a47d-8b03-41a2-99cb-620cd38bbffb,deepseek-ai/DeepSeek-V3.1,together_ai,torch-tensor-parallelism,2448,1299,3747,179.24029,False,0.0,deepseek-ai/DeepSeek-V3.1,torch-tensor-parallelism,179.24029,False,0.0,False,179.24029 +cc1766a1-f6e5-47c5-95b1-7bb245917dda,gpt-5-nano,openai,git-leak-recovery,4794,5297,10091,902.702985,False,0.0,gpt-5-nano,git-leak-recovery,902.702985,False,0.0,False,902.702985 +4b289235-81f9-4b0b-8d19-6da18dbb94df,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,large-scale-text-editing,2531,4246,6777,497.648655,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,large-scale-text-editing,497.648655,False,0.0,False,497.648655 +dcacb5e0-8329-490c-8a9f-730e0e2a6202,OpenAI/gpt-oss-20B,together_ai,form-filling,168,1205,1373,178.350158,False,0.0,OpenAI/gpt-oss-20B,form-filling,178.350158,False,0.0,False,178.350158 +5251c4dd-3473-4146-896d-aa917a4ae002,gemini-2.5-pro,gemini,make-doom-for-mips,15361,3294,18655,901.588419,False,0.0,gemini-2.5-pro,make-doom-for-mips,901.588419,False,0.0,False,901.588419 +09166cd3-0460-46df-9232-8f16174a02ae,gemini-2.5-flash,gemini,sanitize-git-repo,11042,2250,13292,139.677482,False,0.0,gemini-2.5-flash,sanitize-git-repo,139.677482,False,0.0,False,139.677482 +64ce5bed-560f-46fb-bc68-cea7f9de44e9,gpt-5-nano,openai,install-klee-minimal,8347,3055,11402,900.045389,False,0.0,gpt-5-nano,install-klee-minimal,900.045389,False,0.0,False,900.045389 +441619e3-540b-4963-acb5-80288d17c72c,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,mteb-retrieve,2473,1119,3592,230.947369,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,mteb-retrieve,230.947369,False,0.0,False,230.947369 +616ac75f-f0af-4a56-87bb-8dbe5eb21356,OpenAI/gpt-oss-20B,together_ai,write-compressor,3566,14656,18222,900.483195,False,0.0,OpenAI/gpt-oss-20B,write-compressor,900.483195,False,0.0,False,900.483195 
+6817b652-2442-42d8-8e5e-1c98b65b7a39,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-pov-ray,25325,7277,32602,986.831139,True,1.0,moonshotai/Kimi-K2-Instruct-0905,build-pov-ray,986.831139,True,1.0,True,986.831139 +76908251-b3f3-45e1-89a9-ab9016be7d87,moonshotai/Kimi-K2-Instruct-0905,together_ai,sparql-university,5878,2773,8651,316.709093,False,0.0,moonshotai/Kimi-K2-Instruct-0905,sparql-university,316.709093,False,0.0,False,316.709093 +0f834879-7a7c-4a93-b58d-a0151c8db4b3,moonshotai/Kimi-K2-Instruct-0905,together_ai,polyglot-rust-c,13314,15541,28855,928.712501,False,0.0,moonshotai/Kimi-K2-Instruct-0905,polyglot-rust-c,928.712501,False,0.0,False,928.712501 +1db09e50-1b46-4805-89d6-334e42b3459e,moonshotai/Kimi-K2-Instruct-0905,together_ai,reshard-c4-data,7710,5854,13564,717.6119,False,0.0,moonshotai/Kimi-K2-Instruct-0905,reshard-c4-data,717.6119,False,0.0,False,717.6119 +f787959a-c1fd-4758-80d5-67259eb0c4ec,gemini-2.5-pro,gemini,wasm-pipeline,6687,2424,9111,529.520143,False,0.0,gemini-2.5-pro,wasm-pipeline,529.520143,False,0.0,False,529.520143 +9573e490-64f2-499d-b7ed-c24a03122753,gpt-5,openai,fix-git,4412,1623,6035,267.159951,True,1.0,gpt-5,fix-git,267.159951,True,1.0,True,267.159951 +86b0af8c-30e0-449b-9cc1-fb379c5a4a64,gpt-5-mini,openai,model-extraction-relu-logits,3620,10449,14069,931.484553,False,0.0,gpt-5-mini,model-extraction-relu-logits,931.484553,False,0.0,False,931.484553 +cc16e299-1e99-4e4c-9fff-506d05a1f9f8,gpt-5-nano,openai,reverse-engineering,26314,15911,42225,1803.798913,False,0.0,gpt-5-nano,reverse-engineering,1803.798913,False,0.0,False,1803.798913 +f7dd705a-694e-4d11-95e3-53aadb3f1c91,claude-opus-4-1-20250805,anthropic,sqlite-db-truncate,7871,6320,14191,342.057067,True,1.0,claude-opus-4-1-20250805,sqlite-db-truncate,342.057067,True,0.125,True,342.057067 
+5e548c0f-6dae-4f6c-98e0-e4d9ffb1ef17,deepseek-ai/DeepSeek-V3.1,together_ai,sparql-university,8362,4158,12520,244.162693,False,0.0,deepseek-ai/DeepSeek-V3.1,sparql-university,244.162693,False,0.0,False,244.162693 +bfa3ff3d-20f5-4f74-baf1-8a3eb13a3e60,claude-opus-4-1-20250805,anthropic,pytorch-model-cli,29397,11811,41208,638.278229,True,1.0,claude-opus-4-1-20250805,pytorch-model-cli,638.278229,True,0.4285714285714285,True,638.278229 +c7c2e000-4711-495b-bfab-7d5305a3acc1,moonshotai/Kimi-K2-Instruct-0905,together_ai,path-tracing-reverse,9331,8327,17658,2057.761833,False,0.0,moonshotai/Kimi-K2-Instruct-0905,path-tracing-reverse,2057.761833,False,0.0,False,2057.761833 +64d05522-b573-4fa1-b5f3-bb3a165e6cb1,OpenAI/gpt-oss-20B,together_ai,sqlite-with-gcov,16657,17281,33938,900.741708,False,0.0,OpenAI/gpt-oss-20B,sqlite-with-gcov,900.741708,False,0.0,False,900.741708 +b5ebf97b-c60d-46f7-abd8-9adade242286,gpt-5-mini,openai,prove-plus-comm,1804,1393,3197,208.739091,True,1.0,gpt-5-mini,prove-plus-comm,208.739091,True,0.6,True,208.739091 +c35af1fe-f108-44d3-9c07-c30d9bfd3fb2,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,configure-git-webserver,5204,1535,6739,712.381094,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,configure-git-webserver,712.381094,True,0.6,True,712.381094 +eebfbd38-57e9-4bde-82db-d613e109da51,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,write-compressor,28593,13316,41909,951.187845,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,write-compressor,951.187845,False,0.0,False,951.187845 +2d5a8aa2-5da4-481f-8904-73106e06fd73,gemini-2.5-pro,gemini,fix-code-vulnerability,8349,1619,9968,530.373659,True,1.0,gemini-2.5-pro,fix-code-vulnerability,530.373659,True,0.2,True,530.373659 +703cef0a-8a76-489b-8c63-9a9e8c553222,grok-4-0709,xai,port-compressor,37994,28499,66493,3623.846709,False,0.0,grok-4-0709,port-compressor,3623.846709,False,0.0,False,3623.846709 
+1a85ecba-8e29-4b23-bc07-7cfae5a16c87,claude-sonnet-4-20250514,anthropic,pytorch-model-cli,13354,5424,18778,805.782644,True,1.0,claude-sonnet-4-20250514,pytorch-model-cli,805.782644,True,0.4,True,805.782644 +91a20918-7096-4cd0-9d89-6445f31713a8,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,cancel-async-tasks,1378,871,2249,68.728694,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,cancel-async-tasks,68.728694,False,0.8,False,68.728694 +ec4dcdd3-8707-4b40-8d23-c33b6968810a,claude-sonnet-4-20250514,anthropic,feal-differential-cryptanalysis,22202,20675,42877,1800.00256,False,0.0,claude-sonnet-4-20250514,feal-differential-cryptanalysis,1800.00256,False,0.0,False,1800.00256 +c85b9d3f-fb1a-48a0-8406-da6aa1b5060d,gemini-2.5-pro,gemini,schemelike-metacircular-eval,15345,33078,48423,2405.495779,False,0.0,gemini-2.5-pro,schemelike-metacircular-eval,2405.495779,False,0.0,False,2405.495779 +2144d0be-61d2-469b-9142-825062a18ced,moonshotai/Kimi-K2-Instruct-0905,together_ai,make-mips-interpreter,22516,15824,38340,1843.855607,False,0.0,moonshotai/Kimi-K2-Instruct-0905,make-mips-interpreter,1843.855607,False,0.0,False,1843.855607 +20e3922f-8209-4f2d-bdb4-5d895e088d21,gpt-5-mini,openai,dna-insert,6236,4060,10296,360.669975,False,0.0,gpt-5-mini,dna-insert,360.669975,False,0.0,False,360.669975 +dc10df82-13c8-4561-8a00-f9d41d73eb40,grok-4-0709,xai,tune-mjcf,6274,5506,11780,900.081627,False,0.0,grok-4-0709,tune-mjcf,900.081627,False,0.0,False,900.081627 +bca32fb4-5f4a-41fe-8de0-1e7b9508cee5,gpt-5-nano,openai,write-compressor,4202,2697,6899,908.091282,False,0.0,gpt-5-nano,write-compressor,908.091282,False,0.0,False,908.091282 +59e8ab15-2727-47bc-b462-17d43641a1a8,gemini-2.5-pro,gemini,wasm-pipeline,7112,2861,9973,293.04408,False,0.0,gemini-2.5-pro,wasm-pipeline,293.04408,False,0.0,False,293.04408 +197474e1-66e3-4831-bff5-7780c42bce68,gpt-5-mini,openai,tune-mjcf,15581,8668,24249,945.399334,False,0.0,gpt-5-mini,tune-mjcf,945.399334,False,0.0,False,945.399334 
+ec4ddbaa-eafa-4e8a-bd90-de2255a52fa7,gemini-2.5-pro,gemini,model-extraction-relu-logits,1901,1658,3559,1419.73534,False,0.0,gemini-2.5-pro,model-extraction-relu-logits,1419.73534,False,0.0,False,1419.73534 +23db9073-d24e-49a2-8daa-1675270722e1,gpt-5,openai,reverse-engineering,13248,5818,19066,921.824824,True,1.0,gpt-5,reverse-engineering,921.824824,True,0.6666666666666666,True,921.824824 +a7a908e7-31e2-40e0-aa16-d2a86f9dfcc2,gpt-5-nano,openai,crack-7z-hash,15381,6945,22326,492.663071,False,0.0,gpt-5-nano,crack-7z-hash,492.663071,False,0.0,False,492.663071 +e456e088-f414-4e9b-b591-afe167b303f5,grok-code-fast-1,xai,dna-insert,8170,2099,10269,385.976852,False,0.0,grok-code-fast-1,dna-insert,385.976852,False,0.0,False,385.976852 +8bf231b1-040a-4d2c-b85d-f34555e38d77,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,large-scale-text-editing,3763,1507,5270,251.051767,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,large-scale-text-editing,251.051767,False,0.0,False,251.051767 +68ecacf5-967f-4103-bb31-76686db36f44,claude-sonnet-4-20250514,anthropic,build-pov-ray,20102,7766,27868,1883.394436,False,0.0,claude-sonnet-4-20250514,build-pov-ray,1883.394436,False,0.6,False,1883.394436 +cc582766-9a2c-46ed-b83a-d74c60fa5658,gpt-5,openai,sanitize-git-repo,6056,5257,11313,900.094246,False,0.0,gpt-5,sanitize-git-repo,900.094246,False,0.2857142857142857,False,900.094246 +cea91da9-81c5-46ba-a157-da8ea000859c,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,openssl-selfsigned-cert,1674,1224,2898,113.553917,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,openssl-selfsigned-cert,113.553917,False,0.0,False,113.553917 +c9def2a7-04c6-4772-aae9-c28ee2af7d05,OpenAI/gpt-oss-20B,together_ai,pytorch-model-recovery,844,1708,2552,81.888132,False,0.0,OpenAI/gpt-oss-20B,pytorch-model-recovery,81.888132,False,0.0,False,81.888132 
+cb1205e5-f7f4-43c4-b0fd-cd5768282a88,zai-org/GLM-4.5-Air-FP8,together_ai,pytorch-model-recovery,13080,9886,22966,900.045265,True,1.0,zai-org/GLM-4.5-Air-FP8,pytorch-model-recovery,900.045265,True,0.4,True,900.045265 +8751a7d3-425e-44f5-8eb5-19bc6a9ad8b5,deepseek-ai/DeepSeek-V3.1,together_ai,make-mips-interpreter,23759,17841,41600,1831.131574,False,0.0,deepseek-ai/DeepSeek-V3.1,make-mips-interpreter,1831.131574,False,0.0,False,1831.131574 +3b7e8481-8328-4487-a89b-81bd84ddb83a,moonshotai/Kimi-K2-Instruct-0905,together_ai,mteb-retrieve,3721,3034,6755,375.925406,False,0.0,moonshotai/Kimi-K2-Instruct-0905,mteb-retrieve,375.925406,False,0.0,False,375.925406 +33c3b258-b34a-4df9-925c-971684edf076,claude-sonnet-4-20250514,anthropic,path-tracing-reverse,10016,9421,19437,1093.46063,False,0.0,claude-sonnet-4-20250514,path-tracing-reverse,1093.46063,False,0.0,False,1093.46063 +0fd3a1d6-910d-42ef-8bfd-b447bbb9a98d,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-cython-ext,23168,7006,30174,792.514784,False,0.0,moonshotai/Kimi-K2-Instruct-0905,build-cython-ext,792.514784,False,0.0,False,792.514784 +52b01561-521e-4cf5-bf56-e9072b67c238,gpt-5-mini,openai,mteb-leaderboard,15293,37258,52551,3602.489237,False,0.0,gpt-5-mini,mteb-leaderboard,3602.489237,False,0.0,False,3602.489237 +dc0a9892-35d4-48b7-b7dc-d6839b616d36,gpt-5,openai,bn-fit-modify,12779,12616,25395,782.229744,True,1.0,gpt-5,bn-fit-modify,782.229744,True,0.5,True,782.229744 +d709b652-fce6-4d3b-8dd2-eb88402bf317,grok-code-fast-1,xai,build-initramfs-qemu,2157,1445,3602,138.400149,False,0.0,grok-code-fast-1,build-initramfs-qemu,138.400149,False,0.0,False,138.400149 +ea269c16-b482-46ed-9c5d-a6b39001f60b,deepseek-ai/DeepSeek-V3.1,together_ai,extract-elf,10830,1240,12070,298.164443,True,1.0,deepseek-ai/DeepSeek-V3.1,extract-elf,298.164443,True,0.6,True,298.164443 
+470630eb-8d41-48ef-ab42-92678266fc54,grok-4-0709,xai,install-klee-minimal,9835,2774,12609,902.858161,False,0.0,grok-4-0709,install-klee-minimal,902.858161,False,0.0,False,902.858161 +d533451c-1bcf-4296-b702-3cc9dbcf5a72,OpenAI/gpt-oss-20B,together_ai,install-windows-3.11,13795,56891,70686,3606.884224,False,0.0,OpenAI/gpt-oss-20B,install-windows-3.11,3606.884224,False,0.0,False,3606.884224 +0cd89299-0805-434f-b281-fb01f768a7e6,grok-code-fast-1,xai,large-scale-text-editing,4101,4278,8379,558.664554,False,0.0,grok-code-fast-1,large-scale-text-editing,558.664554,False,0.0,False,558.664554 +39233179-868d-403a-8e48-6fbe668b79d9,claude-sonnet-4-20250514,anthropic,adaptive-rejection-sampler,11671,8877,20548,900.046848,False,0.0,claude-sonnet-4-20250514,adaptive-rejection-sampler,900.046848,False,0.0,False,900.046848 +07d56ad8-ccef-4c2a-b468-80ee37717f98,gpt-5,openai,feal-linear-cryptanalysis,11200,6378,17578,860.564152,True,1.0,gpt-5,feal-linear-cryptanalysis,860.564152,True,1.0,True,860.564152 +687f2dbe-36ce-4b71-9420-986a58a1c2cf,grok-4-0709,xai,db-wal-recovery,1835,1874,3709,1019.140304,False,0.0,grok-4-0709,db-wal-recovery,1019.140304,False,0.2,False,1019.140304 +b1e3d7a6-61f6-4b8d-bd3a-fa8314e7955a,grok-4-0709,xai,nginx-request-logging,3817,1637,5454,396.256201,True,1.0,grok-4-0709,nginx-request-logging,396.256201,True,1.0,True,396.256201 +66bd91ee-0855-4753-ad0f-ab6ae82509d0,gemini-2.5-flash,gemini,qemu-startup,1114,1304,2418,232.744757,False,0.0,gemini-2.5-flash,qemu-startup,232.744757,False,0.2,False,232.744757 +bfa8776a-80a9-415d-852c-96443f9b1d53,OpenAI/gpt-oss-20B,together_ai,adaptive-rejection-sampler,1984,1900,3884,85.64665,False,0.0,OpenAI/gpt-oss-20B,adaptive-rejection-sampler,85.64665,False,0.0,False,85.64665 +ad923874-ba26-47b4-910b-65c45878a365,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,polyglot-rust-c,11334,12674,24008,903.469799,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,polyglot-rust-c,903.469799,False,0.0,False,903.469799 
+108d5a4c-f6b6-4102-be4b-cfd5930c70ff,claude-sonnet-4-20250514,anthropic,chess-best-move,6343,5720,12063,369.575414,False,0.0,claude-sonnet-4-20250514,chess-best-move,369.575414,False,0.0,False,369.575414 +0c394b1a-a690-49f9-be61-cf37e6087d29,gpt-5,openai,extract-elf,4446,3763,8209,303.231561,False,0.0,gpt-5,extract-elf,303.231561,False,0.2857142857142857,False,303.231561 +da706fb1-2911-44ce-9a5d-38d12e5dc16d,grok-4-0709,xai,form-filling,2898,1895,4793,248.24216,False,0.0,grok-4-0709,form-filling,248.24216,False,0.2,False,248.24216 +6dde1c14-c37f-4421-810b-912e270dc377,grok-4-0709,xai,git-leak-recovery,1281,947,2228,503.906558,False,0.0,grok-4-0709,git-leak-recovery,503.906558,False,0.4,False,503.906558 +6ca070b1-3979-4e06-ad4c-03d2614ce63e,zai-org/GLM-4.5-Air-FP8,together_ai,video-processing,9989,10175,20164,527.88485,False,0.0,zai-org/GLM-4.5-Air-FP8,video-processing,527.88485,False,0.0,False,527.88485 +2800688d-d825-43c9-9584-d6441e64b32a,gpt-5-mini,openai,make-mips-interpreter,10019,18743,28762,1830.205166,False,0.0,gpt-5-mini,make-mips-interpreter,1830.205166,False,0.0,False,1830.205166 +08a8ff7f-b681-4427-85a6-5fc5c4ecaeb4,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,chess-best-move,10327,5451,15778,744.059469,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,chess-best-move,744.059469,False,0.0,False,744.059469 +8e5635ca-df06-441e-b8a6-97135f191b69,openai/gpt-oss-120b,together_ai,fix-ocaml-gc,31600,12428,44028,3607.898232,False,0.0,openai/gpt-oss-120b,fix-ocaml-gc,3607.898232,False,0.0,False,3607.898232 +d5595a8e-5357-4d81-b28e-773ef9c34798,grok-4-0709,xai,build-pmars,17437,4890,22327,926.181533,True,1.0,grok-4-0709,build-pmars,926.181533,True,0.2,True,926.181533 +d84c23f3-dccb-4731-9ef9-9ced1bc7aae1,gemini-2.5-flash,gemini,sanitize-git-repo,11938,2928,14866,405.136463,False,0.0,gemini-2.5-flash,sanitize-git-repo,405.136463,False,0.0,False,405.136463 
+8e527883-3aea-4182-89af-29ef15c567a3,gemini-2.5-flash,gemini,hf-model-inference,6414,2180,8594,254.420101,True,1.0,gemini-2.5-flash,hf-model-inference,254.420101,True,0.6,True,254.420101 +e32f2f33-7357-44c4-bbfd-ffc05f06fc59,gpt-5-mini,openai,mteb-leaderboard,41719,37388,79107,3608.335784,False,0.0,gpt-5-mini,mteb-leaderboard,3608.335784,False,0.0,False,3608.335784 +a4b07c7e-19bc-4c3b-aac3-30770b583772,moonshotai/Kimi-K2-Instruct-0905,together_ai,largest-eigenval,9841,9048,18889,729.444764,False,0.0,moonshotai/Kimi-K2-Instruct-0905,largest-eigenval,729.444764,False,0.2,False,729.444764 +928f7549-3088-44e1-8527-b7e0dc56f3a9,openai/gpt-oss-120b,together_ai,reshard-c4-data,6152,2273,8425,199.423086,False,0.0,openai/gpt-oss-120b,reshard-c4-data,199.423086,False,0.0,False,199.423086 +5f761415-d533-4866-bc22-f2e2a7ed409b,gpt-5-mini,openai,largest-eigenval,18929,10065,28994,924.020696,False,0.0,gpt-5-mini,largest-eigenval,924.020696,False,0.0,False,924.020696 +77cfe204-6dfc-493b-b593-19f9bf76f5ad,grok-code-fast-1,xai,log-summary-date-ranges,3946,1861,5807,96.015003,False,0.0,grok-code-fast-1,log-summary-date-ranges,96.015003,False,0.0,False,96.015003 +92bebbe6-466e-40b7-ad70-6e3ad01a9e1c,claude-sonnet-4-20250514,anthropic,cobol-modernization,5118,3325,8443,900.524519,True,1.0,claude-sonnet-4-20250514,cobol-modernization,900.524519,True,1.0,True,900.524519 +bee2c417-be6a-4319-a1e1-3895a2989929,gpt-5,openai,log-summary-date-ranges,6733,2278,9011,141.897095,False,0.0,gpt-5,log-summary-date-ranges,141.897095,False,0.0,False,141.897095 +98d2a0be-9a5b-43a5-a75f-6680a60e9d28,moonshotai/Kimi-K2-Instruct-0905,together_ai,dna-assembly,11763,6841,18604,339.335305,False,0.0,moonshotai/Kimi-K2-Instruct-0905,dna-assembly,339.335305,False,0.0,False,339.335305 +8c930c71-8f4d-4673-a961-0df31f2c83c0,gemini-2.5-flash,gemini,train-fasttext,38315,15229,53544,3602.355845,False,0.0,gemini-2.5-flash,train-fasttext,3602.355845,False,0.0,False,3602.355845 
+eb866939-d739-4f8e-a0cf-fd37f4f8918e,openai/gpt-oss-120b,together_ai,pypi-server,3288,931,4219,102.815255,True,1.0,openai/gpt-oss-120b,pypi-server,102.815255,True,0.4,True,102.815255 +0ed43a97-778c-433d-b238-7855ec636746,gpt-5-mini,openai,form-filling,12026,10994,23020,676.625062,True,1.0,gpt-5-mini,form-filling,676.625062,True,1.0,True,676.625062 +808cac95-e8ad-44e6-871c-2e0cf4f40e00,gpt-5-mini,openai,password-recovery,3098,6524,9622,909.924695,False,0.0,gpt-5-mini,password-recovery,909.924695,False,0.0,False,909.924695 +8d3b5229-627f-49e0-bc79-2690c6c1235b,moonshotai/Kimi-K2-Instruct-0905,together_ai,make-doom-for-mips,22211,6316,28527,901.27387,False,0.0,moonshotai/Kimi-K2-Instruct-0905,make-doom-for-mips,901.27387,False,0.0,False,901.27387 +e2f35e70-9e70-4ef9-a116-e7ac7ca5034c,claude-opus-4-1-20250805,anthropic,mteb-retrieve,2570,1503,4073,567.384364,False,0.0,claude-opus-4-1-20250805,mteb-retrieve,567.384364,False,0.0,False,567.384364 +4b634c45-a1f4-4ab2-abd9-997754f63ec4,gpt-5-nano,openai,winning-avg-corewars,14816,12614,27430,3635.756976,False,0.0,gpt-5-nano,winning-avg-corewars,3635.756976,False,0.0,False,3635.756976 +f9402f1d-67fe-4233-a686-9ff67787619b,grok-code-fast-1,xai,configure-git-webserver,4783,1060,5843,159.346256,False,0.0,grok-code-fast-1,configure-git-webserver,159.346256,False,0.0,False,159.346256 +2735f797-6ff8-4133-b974-3c9b64806e5a,deepseek-ai/DeepSeek-V3.1,together_ai,video-processing,3607,3644,7251,321.598354,False,0.0,deepseek-ai/DeepSeek-V3.1,video-processing,321.598354,False,0.0,False,321.598354 +9ef00f16-ed04-43ab-a38c-cf44c5f68db1,OpenAI/gpt-oss-20B,together_ai,filter-js-from-html,1180,462,1642,23.847287,False,0.0,OpenAI/gpt-oss-20B,filter-js-from-html,23.847287,False,0.0,False,23.847287 +7d2b6597-4f90-48f0-873d-d9d842cdfb62,gpt-5,openai,adaptive-rejection-sampler,4540,19370,23910,900.063841,True,1.0,gpt-5,adaptive-rejection-sampler,900.063841,True,0.4,True,900.063841 
+b16129eb-7d7d-4b46-85d6-3d63ee08bfe7,gpt-5-mini,openai,build-pov-ray,17626,37135,54761,6005.852133,False,0.0,gpt-5-mini,build-pov-ray,6005.852133,False,0.0,False,6005.852133 +27f8e549-810e-4c14-ad4b-72fa01b28fc1,claude-sonnet-4-20250514,anthropic,port-compressor,51536,29597,81133,2872.485564,True,1.0,claude-sonnet-4-20250514,port-compressor,2872.485564,True,0.2,True,2872.485564 +4c683ab1-5dcc-47ea-af28-3d921842ce2c,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,qemu-startup,1668,1582,3250,96.133406,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,qemu-startup,96.133406,False,0.4,False,96.133406 +d4a9c83e-4eca-4b21-8064-0d0bedec6413,grok-code-fast-1,xai,sanitize-git-repo,3017,2163,5180,143.342077,False,0.0,grok-code-fast-1,sanitize-git-repo,143.342077,False,0.0,False,143.342077 +c5e70346-269f-42d7-b983-310c86ca648e,grok-4-0709,xai,install-klee-minimal,7682,3879,11561,900.094078,False,0.0,grok-4-0709,install-klee-minimal,900.094078,False,0.0,False,900.094078 +f943eb17-38ec-45d7-9156-57dc16ed976d,claude-sonnet-4-20250514,anthropic,sqlite-with-gcov,12258,2722,14980,1001.348478,False,0.0,claude-sonnet-4-20250514,sqlite-with-gcov,1001.348478,False,0.2,False,1001.348478 +05b9a65e-21a9-486e-b774-3cb081b1da3f,openai/gpt-oss-120b,together_ai,large-scale-text-editing,4407,2300,6707,124.59175,False,0.0,openai/gpt-oss-120b,large-scale-text-editing,124.59175,False,0.0,False,124.59175 +18ce2677-8cbc-4790-83ac-7c6cdf1d5359,grok-4-0709,xai,dna-assembly,5142,830,5972,749.650645,False,0.0,grok-4-0709,dna-assembly,749.650645,False,0.0,False,749.650645 +f6e473ff-febe-4b9d-bce1-5289638617a9,gemini-2.5-pro,gemini,dna-assembly,7289,3158,10447,749.84186,False,0.0,gemini-2.5-pro,dna-assembly,749.84186,False,0.0,False,749.84186 +c1240fdb-3584-4259-b968-0f7319f290ef,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,wasm-pipeline,5320,5754,11074,902.518384,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,wasm-pipeline,902.518384,False,0.6,False,902.518384 
+a865970a-4067-4a13-baa9-2a2f3f56922e,zai-org/GLM-4.5-Air-FP8,together_ai,reverse-engineering,10138,19489,29627,1828.789441,False,0.0,zai-org/GLM-4.5-Air-FP8,reverse-engineering,1828.789441,False,0.0,False,1828.789441 +835ca73b-5497-444b-9c4d-54011f0f99ca,gpt-5-nano,openai,code-from-image,5080,1754,6834,153.95484,False,0.0,gpt-5-nano,code-from-image,153.95484,False,0.0,False,153.95484 +4bbc06d6-d03e-4130-87fb-62b645f8230e,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,path-tracing-reverse,22085,6253,28338,698.288089,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,path-tracing-reverse,698.288089,False,0.0,False,698.288089 +cbabe714-548d-4301-9c53-92d701deb332,gpt-5-mini,openai,bn-fit-modify,3432,3046,6478,234.143162,False,0.0,gpt-5-mini,bn-fit-modify,234.143162,False,0.6,False,234.143162 +ccd7f8f1-eac1-492b-b061-23898aa8af24,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-pov-ray,25766,9990,35756,3975.188471,True,1.0,moonshotai/Kimi-K2-Instruct-0905,build-pov-ray,3975.188471,True,1.0,True,3975.188471 +0b052031-7b5f-4406-95cf-d6f2e4be43d3,grok-code-fast-1,xai,feal-differential-cryptanalysis,4809,4482,9291,472.351033,False,0.0,grok-code-fast-1,feal-differential-cryptanalysis,472.351033,False,0.0,False,472.351033 +322c02c4-bcc0-4158-a235-37f217ecdd04,openai/gpt-oss-120b,together_ai,mteb-leaderboard,966,270,1236,15.610789,False,0.0,openai/gpt-oss-120b,mteb-leaderboard,15.610789,False,0.0,False,15.610789 +4f14594b-ded0-409e-b094-79b86b4fe4cc,openai/gpt-oss-120b,together_ai,dna-insert,10530,8358,18888,393.16437,False,0.0,openai/gpt-oss-120b,dna-insert,393.16437,False,0.0,False,393.16437 +ab35bc21-50bb-49b3-8320-275df99d315e,OpenAI/gpt-oss-20B,together_ai,form-filling,168,1544,1712,60.368895,False,0.0,OpenAI/gpt-oss-20B,form-filling,60.368895,False,0.0,False,60.368895 +10dfff30-00b3-43d0-a2c2-c2cad7fb6bb0,gpt-5-nano,openai,gpt2-codegolf,3066,5667,8733,901.495722,False,0.0,gpt-5-nano,gpt2-codegolf,901.495722,False,0.0,False,901.495722 
+84a5e354-25f2-4b2d-b56c-12fa33c19d86,moonshotai/Kimi-K2-Instruct-0905,together_ai,make-mips-interpreter,26805,18252,45057,1807.752178,False,0.0,moonshotai/Kimi-K2-Instruct-0905,make-mips-interpreter,1807.752178,False,0.0,False,1807.752178 +6e747ca1-f4aa-4db0-8116-0eefe733abaf,openai/gpt-oss-120b,together_ai,train-fasttext,12949,7016,19965,1404.93066,False,0.0,openai/gpt-oss-120b,train-fasttext,1404.93066,False,0.0,False,1404.93066 +8c29090d-c415-4479-b812-8694e1524f1f,claude-opus-4-1-20250805,anthropic,git-leak-recovery,2670,1619,4289,228.257215,True,1.0,claude-opus-4-1-20250805,git-leak-recovery,228.257215,True,1.0,True,228.257215 +0c28f9c0-dec1-4d7b-a172-f819173a3ceb,gpt-5,openai,gpt2-codegolf,10104,9279,19383,795.122958,False,0.0,gpt-5,gpt2-codegolf,795.122958,False,0.0,False,795.122958 +b861f4d6-3b62-4352-b87f-7b95eb997c42,gpt-5,openai,sanitize-git-repo,11229,5009,16238,812.035069,False,0.0,gpt-5,sanitize-git-repo,812.035069,False,0.2857142857142857,False,812.035069 +bce7f833-aae9-449f-b3dd-e7f4973f4ebb,gemini-2.5-pro,gemini,qemu-alpine-ssh,3516,4251,7767,842.572021,True,1.0,gemini-2.5-pro,qemu-alpine-ssh,842.572021,True,0.2,True,842.572021 +2eabf22c-5d87-47e9-a8bd-1cf0941e750b,openai/gpt-oss-120b,together_ai,polyglot-rust-c,1358,733,2091,92.649689,False,0.0,openai/gpt-oss-120b,polyglot-rust-c,92.649689,False,0.0,False,92.649689 +ad2eb0e5-ef69-4731-acff-d21a23053218,gpt-5-nano,openai,reverse-engineering,21441,10437,31878,1827.004584,False,0.0,gpt-5-nano,reverse-engineering,1827.004584,False,0.0,False,1827.004584 +04ab7c9f-ce5c-46d2-a7da-d512fd63f9ca,moonshotai/Kimi-K2-Instruct-0905,together_ai,sparql-university,10247,6628,16875,413.753981,False,0.0,moonshotai/Kimi-K2-Instruct-0905,sparql-university,413.753981,False,0.0,False,413.753981 
+3813e183-9d73-45ce-b6d7-5a788973cb85,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-pov-ray,18172,6496,24668,1781.657345,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-pov-ray,1781.657345,False,0.0,False,1781.657345 +dc5ead54-0bd0-4d4c-b205-16942ee6b0b3,claude-opus-4-1-20250805,anthropic,filter-js-from-html,8268,7429,15697,853.078775,False,0.0,claude-opus-4-1-20250805,filter-js-from-html,853.078775,False,0.0,False,853.078775 +25ecb3c8-99b2-4212-a3cc-4e8e3de85bce,gemini-2.5-pro,gemini,tune-mjcf,7081,7603,14684,902.748268,False,0.0,gemini-2.5-pro,tune-mjcf,902.748268,False,0.2,False,902.748268 +4801255f-93bb-4a2d-bd2c-d38c10b9a2e6,gpt-5-mini,openai,count-dataset-tokens,9959,9372,19331,900.058877,False,0.0,gpt-5-mini,count-dataset-tokens,900.058877,False,0.0,False,900.058877 +bb47de03-a41f-40bd-8987-b98c7c77e614,gpt-5-nano,openai,mteb-retrieve,7730,6876,14606,499.205285,False,0.0,gpt-5-nano,mteb-retrieve,499.205285,False,0.0,False,499.205285 +26171d54-02e8-46cd-9800-600bc07d26ff,grok-4-0709,xai,crack-7z-hash,9412,3918,13330,664.890356,True,1.0,grok-4-0709,crack-7z-hash,664.890356,True,0.8,True,664.890356 +cec472fd-4d5a-45c9-8be9-bf71e0c16b49,claude-opus-4-1-20250805,anthropic,regex-log,3306,2886,6192,198.077775,True,1.0,claude-opus-4-1-20250805,regex-log,198.077775,True,0.5714285714285714,True,198.077775 +25696c0b-e73c-489b-9e3e-39f809321d9d,zai-org/GLM-4.5-Air-FP8,together_ai,cobol-modernization,6346,5409,11755,918.676874,True,1.0,zai-org/GLM-4.5-Air-FP8,cobol-modernization,918.676874,True,0.4,True,918.676874 +513b7b5c-cc32-4c6a-9a1e-0f995451893c,gpt-5-nano,openai,reverse-engineering,28900,14473,43373,1803.218777,False,0.0,gpt-5-nano,reverse-engineering,1803.218777,False,0.0,False,1803.218777 +2f1bded6-3414-4bbc-af0c-4b827ae50b49,gpt-5,openai,openssl-selfsigned-cert,2319,1393,3712,134.891475,True,1.0,gpt-5,openssl-selfsigned-cert,134.891475,True,1.0,True,134.891475 
+dcfd5012-3732-4bad-ae3f-bb9b15aa4d0d,gemini-2.5-flash,gemini,openssl-selfsigned-cert,2201,1733,3934,96.088008,False,0.0,gemini-2.5-flash,openssl-selfsigned-cert,96.088008,False,0.0,False,96.088008 +7e9b0249-63a0-4493-b28a-b435613bb6df,gpt-5-nano,openai,form-filling,10607,11478,22085,907.71556,False,0.0,gpt-5-nano,form-filling,907.71556,False,0.6,False,907.71556 +a7434d54-fed2-489c-aaf5-de9db27742a5,moonshotai/Kimi-K2-Instruct-0905,together_ai,circuit-fibsqrt,29112,33250,62362,3615.434352,False,0.0,moonshotai/Kimi-K2-Instruct-0905,circuit-fibsqrt,3615.434352,False,0.0,False,3615.434352 +bf0a34aa-4602-4f5b-ab8f-30df5026db01,OpenAI/gpt-oss-20B,together_ai,distribution-search,790,1581,2371,72.697168,False,0.0,OpenAI/gpt-oss-20B,distribution-search,72.697168,False,0.0,False,72.697168 +e6454828-7cc7-476b-927e-e01c78d831c4,gpt-5,openai,cancel-async-tasks,2501,1799,4300,140.779789,True,1.0,gpt-5,cancel-async-tasks,140.779789,True,0.6,True,140.779789 +a62d0bea-a605-47cd-a544-7404e67b5b71,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,crack-7z-hash,9978,3057,13035,534.435145,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,crack-7z-hash,534.435145,False,0.0,False,534.435145 +6f4f0cc9-386f-4f13-9c3a-7ff6266dfe75,gpt-5-mini,openai,fix-ocaml-gc,18473,21093,39566,3600.000779,False,0.0,gpt-5-mini,fix-ocaml-gc,3600.000779,False,0.0,False,3600.000779 +27e63949-b341-40ff-b23e-77f3766addd3,claude-sonnet-4-20250514,anthropic,build-initramfs-qemu,3826,3476,7302,191.329906,False,0.0,claude-sonnet-4-20250514,build-initramfs-qemu,191.329906,False,0.0,False,191.329906 +c753c4a6-cd09-4661-a6cd-1e888f7ddb0d,OpenAI/gpt-oss-20B,together_ai,qemu-alpine-ssh,265,1683,1948,102.47707,False,0.0,OpenAI/gpt-oss-20B,qemu-alpine-ssh,102.47707,False,0.0,False,102.47707 +4772b338-83aa-4288-8a8b-e8312fc64437,deepseek-ai/DeepSeek-V3.1,together_ai,dna-insert,7478,5767,13245,367.339669,False,0.0,deepseek-ai/DeepSeek-V3.1,dna-insert,367.339669,False,0.0,False,367.339669 
+d4916c40-e25f-4b8a-bc1c-53ee5faa10e4,deepseek-ai/DeepSeek-V3.1,together_ai,feal-linear-cryptanalysis,25722,24058,49780,1814.528365,False,0.0,deepseek-ai/DeepSeek-V3.1,feal-linear-cryptanalysis,1814.528365,False,0.0,False,1814.528365 +5ea83cc7-e311-4060-aa46-9fc26475888c,OpenAI/gpt-oss-20B,together_ai,password-recovery,2333,5459,7792,183.070605,False,0.0,OpenAI/gpt-oss-20B,password-recovery,183.070605,False,0.0,False,183.070605 +a1c69c39-b122-4744-940c-d1c081a286eb,openai/gpt-oss-120b,together_ai,polyglot-c-py,1460,1628,3088,117.740586,False,0.0,openai/gpt-oss-120b,polyglot-c-py,117.740586,False,0.0,False,117.740586 +b06f5648-447b-4a39-9e86-6a5c4ab33b8c,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,pytorch-model-cli,4007,1874,5881,160.840025,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,pytorch-model-cli,160.840025,False,0.0,False,160.840025 +65793433-8b24-453c-8d2e-343f8ad68ecc,OpenAI/gpt-oss-20B,together_ai,cancel-async-tasks,881,1464,2345,40.721059,False,0.0,OpenAI/gpt-oss-20B,cancel-async-tasks,40.721059,False,0.0,False,40.721059 +b78ba586-46ce-4453-bc32-64c8a4403906,gpt-5-mini,openai,vulnerable-secret,5084,5796,10880,904.559886,False,0.0,gpt-5-mini,vulnerable-secret,904.559886,False,0.4,False,904.559886 +7e8812f1-a339-4fde-9000-e9f444056788,zai-org/GLM-4.5-Air-FP8,together_ai,cobol-modernization,13407,14128,27535,396.241093,False,0.0,zai-org/GLM-4.5-Air-FP8,cobol-modernization,396.241093,False,0.4,False,396.241093 +91597cc2-906a-49f3-870e-f77ca9a3822c,deepseek-ai/DeepSeek-V3.1,together_ai,install-windows-3.11,9328,3524,12852,1306.532762,False,0.0,deepseek-ai/DeepSeek-V3.1,install-windows-3.11,1306.532762,False,0.0,False,1306.532762 +874e3c23-a45e-4e2f-aff6-dc76926431ee,gemini-2.5-flash,gemini,git-leak-recovery,3610,3093,6703,274.338204,True,1.0,gemini-2.5-flash,git-leak-recovery,274.338204,True,0.6,True,274.338204 
+97c95118-1ccd-482d-be34-6ef8ebe081de,openai/gpt-oss-120b,together_ai,fix-ocaml-gc,27493,21319,48812,3646.360484,False,0.0,openai/gpt-oss-120b,fix-ocaml-gc,3646.360484,False,0.0,False,3646.360484 +d596ec83-9337-4876-b656-55f1e4d81d4a,openai/gpt-oss-120b,together_ai,financial-document-processor,1717,1177,2894,85.524672,False,0.0,openai/gpt-oss-120b,financial-document-processor,85.524672,False,0.0,False,85.524672 +99c0627c-6e49-4fdb-a230-ac59625cc09c,openai/gpt-oss-120b,together_ai,filter-js-from-html,1472,1542,3014,37.773888,False,0.0,openai/gpt-oss-120b,filter-js-from-html,37.773888,False,0.0,False,37.773888 +472c5afe-743c-4eb6-be36-eb3e2b1bccb6,grok-code-fast-1,xai,filter-js-from-html,1716,879,2595,39.359657,False,0.0,grok-code-fast-1,filter-js-from-html,39.359657,False,0.0,False,39.359657 +1934a47d-4788-4c63-a85c-f9989722939e,moonshotai/Kimi-K2-Instruct-0905,together_ai,crack-7z-hash,9036,3599,12635,290.86407,True,1.0,moonshotai/Kimi-K2-Instruct-0905,crack-7z-hash,290.86407,True,1.0,True,290.86407 +fe0c050a-861a-407c-88b8-b7f067233e18,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,distribution-search,8480,7710,16190,534.762051,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,distribution-search,534.762051,False,0.4,False,534.762051 +e7c99fd9-783f-459b-b8f0-ca5a1c8cbe0d,zai-org/GLM-4.5-Air-FP8,together_ai,reshard-c4-data,18915,15831,34746,657.352434,False,0.0,zai-org/GLM-4.5-Air-FP8,reshard-c4-data,657.352434,False,0.0,False,657.352434 +13e5bc0e-39ea-4aa9-82ab-704f3e182960,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,cancel-async-tasks,3637,2926,6563,269.034483,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,cancel-async-tasks,269.034483,False,0.6,False,269.034483 +698521b5-5662-4dd0-a19c-d26b80bb331c,gpt-5-nano,openai,pytorch-model-cli,9327,3304,12631,259.063906,False,0.0,gpt-5-nano,pytorch-model-cli,259.063906,False,0.0,False,259.063906 
+7bbaed4d-4304-4192-b938-ce14edca0610,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,constraints-scheduling,2945,3286,6231,118.687236,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,constraints-scheduling,118.687236,False,0.0,False,118.687236 +37c36cea-c799-40ba-b8d2-30f80711d9c5,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,log-summary-date-ranges,4562,2065,6627,258.871112,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,log-summary-date-ranges,258.871112,False,0.0,False,258.871112 +7aa15593-8d6e-426f-9295-1df9030a9729,moonshotai/Kimi-K2-Instruct-0905,together_ai,sqlite-with-gcov,12757,3880,16637,324.311196,False,0.0,moonshotai/Kimi-K2-Instruct-0905,sqlite-with-gcov,324.311196,False,0.4,False,324.311196 +32bf7861-fca6-449d-a9d0-94309bc8ae1c,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,largest-eigenval,9138,6206,15344,435.740243,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,largest-eigenval,435.740243,False,0.0,False,435.740243 +00a50e6c-0380-4a26-a608-9a5f7d36f3bc,gpt-5-mini,openai,schemelike-metacircular-eval,31123,35134,66257,2410.55378,False,0.0,gpt-5-mini,schemelike-metacircular-eval,2410.55378,False,0.0,False,2410.55378 +4d7eb9bf-cb85-4a1d-902d-409a93a062f5,deepseek-ai/DeepSeek-V3.1,together_ai,port-compressor,49510,32514,82024,3640.213913,False,0.0,deepseek-ai/DeepSeek-V3.1,port-compressor,3640.213913,False,0.0,False,3640.213913 +67494241-47ce-4f91-b593-52dcc57f4f62,deepseek-ai/DeepSeek-V3.1,together_ai,polyglot-c-py,34779,19686,54465,912.715277,False,0.0,deepseek-ai/DeepSeek-V3.1,polyglot-c-py,912.715277,False,0.0,False,912.715277 +76d25d68-9482-42df-b78b-bc72905fccb5,moonshotai/Kimi-K2-Instruct-0905,together_ai,install-windows-3.11,9519,6204,15723,1271.822643,False,0.0,moonshotai/Kimi-K2-Instruct-0905,install-windows-3.11,1271.822643,False,0.0,False,1271.822643 
+43511834-5e9a-4084-afc8-cd5d47201c33,gpt-5-mini,openai,count-dataset-tokens,11207,7015,18222,756.869092,False,0.0,gpt-5-mini,count-dataset-tokens,756.869092,False,0.0,False,756.869092 +445d761f-0bf4-4e5d-ab0b-37c4a733164c,gpt-5,openai,chess-best-move,20000,9204,29204,901.844325,False,0.0,gpt-5,chess-best-move,901.844325,False,0.0,False,901.844325 +f5283f4b-8974-43f7-a40c-ee5fa96ec462,grok-code-fast-1,xai,filter-js-from-html,1146,525,1671,68.472217,False,0.0,grok-code-fast-1,filter-js-from-html,68.472217,False,0.0,False,68.472217 +dce71606-3c3d-44ec-82c9-2ff2b6b90017,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,video-processing,11421,12053,23474,734.966628,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,video-processing,734.966628,False,0.0,False,734.966628 +6bf2a2bd-d3d6-4179-9a29-3e7afb95dad9,claude-sonnet-4-20250514,anthropic,regex-log,2179,1770,3949,252.274683,True,1.0,claude-sonnet-4-20250514,regex-log,252.274683,True,0.8,True,252.274683 +7aece6b0-620a-43e7-9e71-3097b912639b,moonshotai/Kimi-K2-Instruct-0905,together_ai,circuit-fibsqrt,18368,20645,39013,1391.303329,False,0.0,moonshotai/Kimi-K2-Instruct-0905,circuit-fibsqrt,1391.303329,False,0.0,False,1391.303329 +51f85e02-5b15-4f3d-9f3d-0ebd155c377a,gpt-5,openai,chess-best-move,16659,6488,23147,924.433937,False,0.0,gpt-5,chess-best-move,924.433937,False,0.0,False,924.433937 +5fe15e49-cfc2-4b14-ba17-7e3b5f2df5a3,grok-code-fast-1,xai,fix-git,8086,3875,11961,852.275154,False,0.0,grok-code-fast-1,fix-git,852.275154,False,0.2,False,852.275154 +beb42e90-b6e2-4448-b750-dec215da40a8,claude-sonnet-4-20250514,anthropic,video-processing,7134,5449,12583,595.645043,False,0.0,claude-sonnet-4-20250514,video-processing,595.645043,False,0.0,False,595.645043 +b8c14b87-b5b9-4737-9d9b-35fa732fd621,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,git-leak-recovery,3450,2816,6266,411.623186,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,git-leak-recovery,411.623186,True,1.0,True,411.623186 
+7c9da7dc-7917-4261-befd-caebb15cd116,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,crack-7z-hash,3623,1879,5502,68.802228,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,crack-7z-hash,68.802228,False,0.0,False,68.802228 +0d1996b6-6af8-447b-9518-3aa08cd94470,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,make-mips-interpreter,26161,8580,34741,1105.655288,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,make-mips-interpreter,1105.655288,False,0.0,False,1105.655288 +b59b9cb4-f824-4081-b887-928ae94f3714,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,port-compressor,57367,43947,101314,3023.158004,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,port-compressor,3023.158004,False,0.0,False,3023.158004 +8253e46b-2d9d-4330-91c2-a9b4e7f32f73,openai/gpt-oss-120b,together_ai,nginx-request-logging,3844,1702,5546,134.591175,False,0.0,openai/gpt-oss-120b,nginx-request-logging,134.591175,False,0.4,False,134.591175 +a6ffc56f-5d72-4555-a5a7-8d81dba526a4,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,adaptive-rejection-sampler,9200,1124,10324,98.180834,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,adaptive-rejection-sampler,98.180834,False,0.0,False,98.180834 +9258c28c-fc1f-409e-99b6-83c31c426301,grok-4-0709,xai,git-leak-recovery,1297,689,1986,235.720213,True,1.0,grok-4-0709,git-leak-recovery,235.720213,True,0.4,True,235.720213 +57bc73e1-df70-46eb-8427-ba59efd4b9af,grok-code-fast-1,xai,filter-js-from-html,1253,745,1998,367.982357,False,0.0,grok-code-fast-1,filter-js-from-html,367.982357,False,0.0,False,367.982357 +2ffd3819-f3cc-41e8-8090-851fceb5b36d,gpt-5,openai,fix-ocaml-gc,21567,22973,44540,3600.790072,False,0.0,gpt-5,fix-ocaml-gc,3600.790072,False,0.0,False,3600.790072 +71da4ddc-57ee-44be-9ec5-905d3db1cd68,gemini-2.5-pro,gemini,reverse-engineering,11681,4950,16631,1828.588204,False,0.0,gemini-2.5-pro,reverse-engineering,1828.588204,False,0.0,False,1828.588204 
+36687ea4-d7af-4cba-90d2-aee7f7799c6d,claude-opus-4-1-20250805,anthropic,hf-model-inference,5292,3206,8498,151.56206,False,0.0,claude-opus-4-1-20250805,hf-model-inference,151.56206,False,0.25,False,151.56206 +3da85369-7bca-4ffb-a41a-52b6834ad301,gpt-5,openai,qemu-startup,3442,5178,8620,905.013883,True,1.0,gpt-5,qemu-startup,905.013883,True,0.8,True,905.013883 +ace5adf7-b5aa-493d-80cd-60b0824e7b52,deepseek-ai/DeepSeek-V3.1,together_ai,extract-elf,9995,1064,11059,147.410969,True,1.0,deepseek-ai/DeepSeek-V3.1,extract-elf,147.410969,True,0.6,True,147.410969 +35e5a5fa-d458-46bc-931d-c5497b6f9c22,deepseek-ai/DeepSeek-V3.1,together_ai,torch-tensor-parallelism,4829,2489,7318,269.647752,False,0.0,deepseek-ai/DeepSeek-V3.1,torch-tensor-parallelism,269.647752,False,0.0,False,269.647752 +91a43c48-4e40-43b4-b817-1117a64ddd41,deepseek-ai/DeepSeek-V3.1,together_ai,mteb-leaderboard,18910,5876,24786,850.794505,False,0.0,deepseek-ai/DeepSeek-V3.1,mteb-leaderboard,850.794505,False,0.0,False,850.794505 +17a91017-f88a-4642-abd9-af2d7d03aa99,claude-opus-4-1-20250805,anthropic,circuit-fibsqrt,19842,16585,36427,518.937269,False,0.0,claude-opus-4-1-20250805,circuit-fibsqrt,518.937269,False,0.0,False,518.937269 +4330392c-1bb9-4051-b220-b1a81b8742b1,openai/gpt-oss-120b,together_ai,write-compressor,2454,976,3430,1224.669908,False,0.0,openai/gpt-oss-120b,write-compressor,1224.669908,False,0.0,False,1224.669908 +b8424f88-4c20-4594-ab70-baa6344ae901,deepseek-ai/DeepSeek-V3.1,together_ai,pytorch-model-cli,8369,4036,12405,655.597516,False,0.0,deepseek-ai/DeepSeek-V3.1,pytorch-model-cli,655.597516,False,0.0,False,655.597516 +b2f5c470-3a1e-4068-9126-9f7b9fc91d2d,zai-org/GLM-4.5-Air-FP8,together_ai,openssl-selfsigned-cert,1879,1436,3315,49.326186,False,0.0,zai-org/GLM-4.5-Air-FP8,openssl-selfsigned-cert,49.326186,False,0.0,False,49.326186 
+bc3ae8b5-74fc-4454-9b09-a9ca11863b7f,claude-opus-4-1-20250805,anthropic,break-filter-js-from-html,13045,15196,28241,1433.311452,False,0.0,claude-opus-4-1-20250805,break-filter-js-from-html,1433.311452,False,0.2222222222222222,False,1433.311452 +5a5234be-8a8f-442c-88c7-a2ad23935027,openai/gpt-oss-120b,together_ai,polyglot-c-py,4328,6743,11071,276.857032,False,0.0,openai/gpt-oss-120b,polyglot-c-py,276.857032,False,0.0,False,276.857032 +fd315990-06cb-451a-972d-527e2b67435f,gpt-5,openai,tune-mjcf,6264,4369,10633,932.103897,False,0.0,gpt-5,tune-mjcf,932.103897,False,0.0,False,932.103897 +54c0dcde-65f0-4890-a479-ae42f67f6764,deepseek-ai/DeepSeek-V3.1,together_ai,gpt2-codegolf,11001,12825,23826,901.040115,False,0.0,deepseek-ai/DeepSeek-V3.1,gpt2-codegolf,901.040115,False,0.0,False,901.040115 +58a73405-8b97-4458-89da-287c9dc561e1,deepseek-ai/DeepSeek-V3.1,together_ai,install-klee-minimal,15903,2261,18164,948.324873,False,0.0,deepseek-ai/DeepSeek-V3.1,install-klee-minimal,948.324873,False,0.0,False,948.324873 +afb23def-2fbe-4d50-949c-e47b1936dab8,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,model-extraction-relu-logits,1523,941,2464,278.303463,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,model-extraction-relu-logits,278.303463,False,0.0,False,278.303463 +dda6bfb4-6e0e-487c-b3f8-cb59e9f0fbf6,gpt-5,openai,pytorch-model-recovery,12547,19993,32540,900.001126,False,0.0,gpt-5,pytorch-model-recovery,900.001126,False,0.4285714285714285,False,900.001126 +1c80dd90-f60e-4da4-b241-9f2f60812750,gpt-5,openai,dna-insert,961,2950,3911,470.679608,False,0.0,gpt-5,dna-insert,470.679608,False,0.0,False,470.679608 +fdfc18b9-f834-45b2-b62f-56efca017ca7,gpt-5,openai,adaptive-rejection-sampler,6902,17724,24626,902.826155,False,0.0,gpt-5,adaptive-rejection-sampler,902.826155,False,0.4,False,902.826155 
+c464dd5f-0dd3-40cc-83fc-4322351e787f,gpt-5,openai,configure-git-webserver,5767,2368,8135,651.456662,True,1.0,gpt-5,configure-git-webserver,651.456662,True,1.0,True,651.456662 +a2556c43-39f5-42f9-b9c5-fdee28dda496,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,reverse-engineering,14009,9315,23324,715.187133,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,reverse-engineering,715.187133,False,0.0,False,715.187133 +7bceb0f5-9dbd-4804-a5b0-4887835d8af8,gemini-2.5-flash,gemini,log-summary-date-ranges,2462,3833,6295,251.721092,False,0.0,gemini-2.5-flash,log-summary-date-ranges,251.721092,False,0.0,False,251.721092 +32853f59-59e8-42ae-acd8-6ef1cfb2e82d,claude-sonnet-4-20250514,anthropic,dna-assembly,10337,5989,16326,735.313826,False,0.0,claude-sonnet-4-20250514,dna-assembly,735.313826,False,0.0,False,735.313826 +6ea7ae37-00e1-4459-a775-a49cbdd7fcf2,OpenAI/gpt-oss-20B,together_ai,sqlite-db-truncate,920,1404,2324,246.880051,False,0.0,OpenAI/gpt-oss-20B,sqlite-db-truncate,246.880051,False,0.0,False,246.880051 +d7cde291-3d23-438e-ad31-2c51625e1123,moonshotai/Kimi-K2-Instruct-0905,together_ai,model-extraction-relu-logits,8795,8136,16931,843.14087,True,1.0,moonshotai/Kimi-K2-Instruct-0905,model-extraction-relu-logits,843.14087,True,0.4,True,843.14087 +08c3fca4-5ccf-4f35-8de4-8515f8ca0e6c,openai/gpt-oss-120b,together_ai,financial-document-processor,10902,5192,16094,360.900964,False,0.0,openai/gpt-oss-120b,financial-document-processor,360.900964,False,0.0,False,360.900964 +696ff5d1-b026-4504-a0e2-f6202d0f75d3,gpt-5-nano,openai,mteb-leaderboard,31802,43007,74809,3600.029678,False,0.0,gpt-5-nano,mteb-leaderboard,3600.029678,False,0.0,False,3600.029678 +44a6d18f-41ae-448b-ac70-aa2b98482df2,deepseek-ai/DeepSeek-V3.1,together_ai,tune-mjcf,7014,4253,11267,1005.474516,False,0.0,deepseek-ai/DeepSeek-V3.1,tune-mjcf,1005.474516,False,0.0,False,1005.474516 
+d4d717d4-2fae-4fab-80b8-112fe58968c1,deepseek-ai/DeepSeek-V3.1,together_ai,count-dataset-tokens,13055,2499,15554,919.248923,False,0.0,deepseek-ai/DeepSeek-V3.1,count-dataset-tokens,919.248923,False,0.0,False,919.248923 +85bded94-4836-4fbb-8f52-e9db02b46261,grok-code-fast-1,xai,configure-git-webserver,4491,646,5137,97.397409,False,0.0,grok-code-fast-1,configure-git-webserver,97.397409,False,0.0,False,97.397409 +297ee20b-9af8-4c32-ba1c-277a4e76b271,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,adaptive-rejection-sampler,5500,1154,6654,900.032628,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,adaptive-rejection-sampler,900.032628,False,0.0,False,900.032628 +0c0067e5-be3d-4c9a-b1fd-7beaf3e13183,gpt-5-nano,openai,filter-js-from-html,3554,4612,8166,676.114883,False,0.0,gpt-5-nano,filter-js-from-html,676.114883,False,0.0,False,676.114883 +14542b18-5878-4215-a87f-575e8b0d57e3,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,mteb-retrieve,3784,2626,6410,326.776511,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,mteb-retrieve,326.776511,False,0.0,False,326.776511 +fe88016b-2e99-4673-bbf0-94506a64653b,claude-opus-4-1-20250805,anthropic,vulnerable-secret,6532,6055,12587,318.515285,True,1.0,claude-opus-4-1-20250805,vulnerable-secret,318.515285,True,0.625,True,318.515285 +5828f51b-7e9a-49c5-95cb-5975c95a317c,claude-sonnet-4-20250514,anthropic,git-leak-recovery,3128,3324,6452,376.98746,True,1.0,claude-sonnet-4-20250514,git-leak-recovery,376.98746,True,1.0,True,376.98746 +d23f9451-2e4a-40ed-a04c-7b567b8f2b80,gemini-2.5-flash,gemini,sqlite-with-gcov,6598,1505,8103,203.85763,True,1.0,gemini-2.5-flash,sqlite-with-gcov,203.85763,True,0.2,True,203.85763 +8eac36a4-c736-436e-b72e-730f6cbc55fe,grok-code-fast-1,xai,video-processing,2015,1448,3463,91.194466,False,0.0,grok-code-fast-1,video-processing,91.194466,False,0.0,False,91.194466 
+ef12d1b0-3bae-4248-8b0e-3e405a79d1f1,gpt-5,openai,pytorch-model-recovery,12770,11924,24694,901.025254,False,0.0,gpt-5,pytorch-model-recovery,901.025254,False,0.4285714285714285,False,901.025254 +afbe9715-3b4f-4f04-b8a0-c9eec4bbeba7,gpt-5-mini,openai,prove-plus-comm,1437,893,2330,100.040451,False,0.0,gpt-5-mini,prove-plus-comm,100.040451,False,0.6,False,100.040451 +8ad142c9-01e7-46b4-9230-6c982b8e8741,claude-opus-4-1-20250805,anthropic,password-recovery,8474,3640,12114,869.559788,True,1.0,claude-opus-4-1-20250805,password-recovery,869.559788,True,0.5555555555555556,True,869.559788 +2ef28364-d183-4268-bc32-6ed4c27ffc21,gpt-5,openai,mteb-retrieve,2174,1289,3463,187.925343,False,0.0,gpt-5,mteb-retrieve,187.925343,False,0.0,False,187.925343 +bfc30cf3-c2d1-484f-bd40-5cba87c9c021,OpenAI/gpt-oss-20B,together_ai,feal-linear-cryptanalysis,4689,14594,19283,1836.216547,False,0.0,OpenAI/gpt-oss-20B,feal-linear-cryptanalysis,1836.216547,False,0.0,False,1836.216547 +1ed5ee2b-0ca3-4927-9e1c-ff1359ba684c,gpt-5,openai,qemu-alpine-ssh,1373,1208,2581,420.593761,False,0.0,gpt-5,qemu-alpine-ssh,420.593761,False,0.1666666666666666,False,420.593761 +d3a19304-a725-4868-9bc0-0df4651d34d2,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sanitize-git-repo,11751,1677,13428,372.027776,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sanitize-git-repo,372.027776,False,0.0,False,372.027776 +59c3d6eb-b706-4584-9e60-089c5be59b82,gpt-5,openai,regex-log,1388,1596,2984,168.70928,True,1.0,gpt-5,regex-log,168.70928,True,1.0,True,168.70928 +9ee16c08-cecb-46e2-9eaa-8eb39b2db039,claude-sonnet-4-20250514,anthropic,nginx-request-logging,5881,3769,9650,448.836396,True,1.0,claude-sonnet-4-20250514,nginx-request-logging,448.836396,True,1.0,True,448.836396 +04f840a0-3164-4f41-95e2-356df2c198bd,deepseek-ai/DeepSeek-V3.1,together_ai,path-tracing,21082,20456,41538,1803.631786,False,0.0,deepseek-ai/DeepSeek-V3.1,path-tracing,1803.631786,False,0.0,False,1803.631786 
+3a7177c5-e63f-4db2-a6d0-192a4d9eef02,deepseek-ai/DeepSeek-V3.1,together_ai,nginx-request-logging,4572,2377,6949,147.721254,True,1.0,deepseek-ai/DeepSeek-V3.1,nginx-request-logging,147.721254,True,0.4,True,147.721254 +5bfdf8c1-a281-4c50-b4b0-74ca6e15b4e8,OpenAI/gpt-oss-20B,together_ai,sanitize-git-repo,2612,979,3591,102.413541,False,0.0,OpenAI/gpt-oss-20B,sanitize-git-repo,102.413541,False,0.0,False,102.413541 +e59a7ba4-c580-4bea-81d5-49485b946047,moonshotai/Kimi-K2-Instruct-0905,together_ai,log-summary-date-ranges,7881,2341,10222,127.136382,True,1.0,moonshotai/Kimi-K2-Instruct-0905,log-summary-date-ranges,127.136382,True,0.8,True,127.136382 +6b753aee-fa73-47a3-8cdc-f5db2db353b2,OpenAI/gpt-oss-20B,together_ai,write-compressor,480,1925,2405,310.212859,False,0.0,OpenAI/gpt-oss-20B,write-compressor,310.212859,False,0.0,False,310.212859 +85c0ff26-265a-4210-b780-bb3db15ff8ea,gemini-2.5-flash,gemini,build-pmars,18873,5634,24507,271.468212,True,1.0,gemini-2.5-flash,build-pmars,271.468212,True,0.8,True,271.468212 +76f43fa6-deb4-4bd3-bc2b-239a45394e7f,OpenAI/gpt-oss-20B,together_ai,train-fasttext,6598,44258,50856,3627.670412,False,0.0,OpenAI/gpt-oss-20B,train-fasttext,3627.670412,False,0.0,False,3627.670412 +b1ad8645-9ee0-45e0-aef7-a491a07d3393,grok-4-0709,xai,make-mips-interpreter,12081,14628,26709,1809.511643,False,0.0,grok-4-0709,make-mips-interpreter,1809.511643,False,0.0,False,1809.511643 +a7b3dede-597d-4ea7-8ba0-905d43e93c23,moonshotai/Kimi-K2-Instruct-0905,together_ai,large-scale-text-editing,3367,5260,8627,591.376498,False,0.0,moonshotai/Kimi-K2-Instruct-0905,large-scale-text-editing,591.376498,False,0.0,False,591.376498 +19c5e3de-69c6-483c-ae52-714e6a95b1b6,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,merge-diff-arc-agi-task,15513,8529,24042,725.307267,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,merge-diff-arc-agi-task,725.307267,False,0.4,False,725.307267 
+77befbd9-2073-4e41-9c2c-f79641ad5a09,grok-4-0709,xai,reshard-c4-data,4282,2699,6981,901.086579,False,0.0,grok-4-0709,reshard-c4-data,901.086579,False,0.0,False,901.086579 +0d3715ad-cb91-4565-b152-20ba83aaa584,gpt-5-nano,openai,build-pov-ray,6785,19270,26055,6385.659199,False,0.0,gpt-5-nano,build-pov-ray,6385.659199,False,0.0,False,6385.659199 +63abacd9-b87c-477c-9ad5-d18cdbf1ebaf,gpt-5-mini,openai,write-compressor,12574,9223,21797,793.427209,False,0.0,gpt-5-mini,write-compressor,793.427209,False,0.0,False,793.427209 +f49a9401-7489-4781-87bc-d4ef02469b86,zai-org/GLM-4.5-Air-FP8,together_ai,make-mips-interpreter,19457,14849,34306,673.881244,False,0.0,zai-org/GLM-4.5-Air-FP8,make-mips-interpreter,673.881244,False,0.0,False,673.881244 +8b85ef64-6d93-4709-8389-ae308d21f572,gpt-5-nano,openai,large-scale-text-editing,3404,6064,9468,1201.750252,False,0.0,gpt-5-nano,large-scale-text-editing,1201.750252,False,0.0,False,1201.750252 +37570c15-1821-4744-9b4b-e6025a08e3b5,deepseek-ai/DeepSeek-V3.1,together_ai,form-filling,7771,5862,13633,263.519789,True,1.0,deepseek-ai/DeepSeek-V3.1,form-filling,263.519789,True,0.8,True,263.519789 +0672684b-ebda-4e1d-acc5-52d9e356988e,gpt-5-nano,openai,pytorch-model-recovery,22400,26296,48696,900.016947,False,0.0,gpt-5-nano,pytorch-model-recovery,900.016947,False,0.0,False,900.016947 +029e4ac6-be71-436e-b58b-681bec0d33f1,grok-code-fast-1,xai,mteb-leaderboard,929,506,1435,54.017572,False,0.0,grok-code-fast-1,mteb-leaderboard,54.017572,False,0.0,False,54.017572 +a4d1244e-5523-47f6-bdb3-9105806e6822,gpt-5-nano,openai,sanitize-git-repo,9458,9439,18897,902.627943,False,0.0,gpt-5-nano,sanitize-git-repo,902.627943,False,0.0,False,902.627943 +5db2f59e-165f-4634-82d7-fec45a0a9bcf,gemini-2.5-flash,gemini,circuit-fibsqrt,23852,53086,76938,3600.288436,False,0.0,gemini-2.5-flash,circuit-fibsqrt,3600.288436,False,0.0,False,3600.288436 
+7c243181-72d3-4a7f-b77e-786e6f078457,zai-org/GLM-4.5-Air-FP8,together_ai,polyglot-c-py,23272,29194,52466,919.331625,False,0.0,zai-org/GLM-4.5-Air-FP8,polyglot-c-py,919.331625,False,0.0,False,919.331625 +71928e96-c486-4790-8d04-2a14cf0a44ac,claude-sonnet-4-20250514,anthropic,build-pov-ray,13432,9903,23335,2059.80543,False,0.0,claude-sonnet-4-20250514,build-pov-ray,2059.80543,False,0.6,False,2059.80543 +1083dc22-2909-4d28-9026-e515d6cf8efe,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,pytorch-model-recovery,2902,2626,5528,242.533156,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,pytorch-model-recovery,242.533156,False,0.0,False,242.533156 +eceb3b8d-e720-4f5a-8312-e29233f9626a,moonshotai/Kimi-K2-Instruct-0905,together_ai,extract-elf,8964,6122,15086,355.680177,False,0.0,moonshotai/Kimi-K2-Instruct-0905,extract-elf,355.680177,False,0.6,False,355.680177 +c5d3d342-c9fb-45e8-b6c9-7112ff160da8,claude-sonnet-4-20250514,anthropic,crack-7z-hash,10682,5003,15685,664.830349,True,1.0,claude-sonnet-4-20250514,crack-7z-hash,664.830349,True,1.0,True,664.830349 +e1adb003-860d-4701-bf14-c4b12bea0670,claude-sonnet-4-20250514,anthropic,make-mips-interpreter,23313,17076,40389,1831.935171,False,0.0,claude-sonnet-4-20250514,make-mips-interpreter,1831.935171,False,0.0,False,1831.935171 +034010f8-5d38-4119-b596-c4a1e25a8cc6,gpt-5,openai,hf-model-inference,5120,2105,7225,304.240438,True,1.0,gpt-5,hf-model-inference,304.240438,True,1.0,True,304.240438 +24472457-f34e-4074-aa41-aa33fd178913,grok-code-fast-1,xai,nginx-request-logging,3260,955,4215,135.602007,False,0.0,grok-code-fast-1,nginx-request-logging,135.602007,False,0.0,False,135.602007 +ce4b5553-f0fa-46a9-a805-7a1b280a580f,grok-code-fast-1,xai,constraints-scheduling,3639,3706,7345,283.639193,False,0.0,grok-code-fast-1,constraints-scheduling,283.639193,False,0.8,False,283.639193 
+07020d61-dab7-44d6-b40b-48781601f357,gemini-2.5-pro,gemini,polyglot-rust-c,2932,2950,5882,959.010598,False,0.0,gemini-2.5-pro,polyglot-rust-c,959.010598,False,0.0,False,959.010598 +5f5500ce-d56c-42ec-8114-7abb5398645c,gpt-5,openai,git-leak-recovery,6578,7043,13621,901.331757,False,0.0,gpt-5,git-leak-recovery,901.331757,False,0.7142857142857143,False,901.331757 +3573a9b3-362a-4a88-83bf-babc2e692a3c,deepseek-ai/DeepSeek-V3.1,together_ai,path-tracing-reverse,31839,20305,52144,1403.807946,False,0.0,deepseek-ai/DeepSeek-V3.1,path-tracing-reverse,1403.807946,False,0.2,False,1403.807946 +15c0dbd1-92fa-4797-b9de-276d837c204a,zai-org/GLM-4.5-Air-FP8,together_ai,code-from-image,14698,11444,26142,584.150479,False,0.0,zai-org/GLM-4.5-Air-FP8,code-from-image,584.150479,False,0.2,False,584.150479 +1167ddfe-39da-4ce6-b207-748adeb1f74d,gpt-5,openai,reverse-engineering,9511,11916,21427,1800.070388,False,0.0,gpt-5,reverse-engineering,1800.070388,False,0.6666666666666666,False,1800.070388 +0448e7e9-533e-4e5c-833a-5e2f0f0812c6,claude-opus-4-1-20250805,anthropic,configure-git-webserver,6696,2391,9087,99.638185,True,1.0,claude-opus-4-1-20250805,configure-git-webserver,99.638185,True,0.625,True,99.638185 +c9ddcf11-fd31-42b7-8145-25d70f524a1e,claude-opus-4-1-20250805,anthropic,reverse-engineering,49467,47079,96546,1838.021957,False,0.0,claude-opus-4-1-20250805,reverse-engineering,1838.021957,False,0.0,False,1838.021957 +72538fad-95e1-44a5-82e5-0f0f6aebabbc,gpt-5-nano,openai,torch-tensor-parallelism,5542,9900,15442,914.847544,False,0.0,gpt-5-nano,torch-tensor-parallelism,914.847544,False,0.0,False,914.847544 +6b16f7be-5916-46a1-882b-efe399c166cf,gpt-5-mini,openai,fix-code-vulnerability,6674,7833,14507,900.450205,False,0.0,gpt-5-mini,fix-code-vulnerability,900.450205,False,0.0,False,900.450205 +327ce27f-451c-41c8-af2e-5d9e53a71ae3,gpt-5-nano,openai,merge-diff-arc-agi-task,8939,5842,14781,900.947232,False,0.0,gpt-5-nano,merge-diff-arc-agi-task,900.947232,False,0.2,False,900.947232 
+db55bf01-f713-42c4-a6c4-787628b7e419,gpt-5-mini,openai,pytorch-model-recovery,11055,9180,20235,825.620966,False,0.0,gpt-5-mini,pytorch-model-recovery,825.620966,False,0.0,False,825.620966 +efe50b4b-77d7-4521-8cd2-cd52fd924e57,moonshotai/Kimi-K2-Instruct-0905,together_ai,log-summary-date-ranges,9867,4082,13949,272.706163,True,1.0,moonshotai/Kimi-K2-Instruct-0905,log-summary-date-ranges,272.706163,True,0.8,True,272.706163 +3433962e-d8b6-47c9-b107-27c9d4903e31,gemini-2.5-flash,gemini,configure-git-webserver,5099,1147,6246,493.917429,False,0.0,gemini-2.5-flash,configure-git-webserver,493.917429,False,0.0,False,493.917429 +3f84f3d4-9993-4a5a-8b2a-fa35fb20b030,gemini-2.5-pro,gemini,dna-assembly,2855,3970,6825,269.538427,False,0.0,gemini-2.5-pro,dna-assembly,269.538427,False,0.0,False,269.538427 +9b6acff1-3b66-4167-a07c-7ecfd3ad2819,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,circuit-fibsqrt,1742,2578,4320,131.184082,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,circuit-fibsqrt,131.184082,False,0.0,False,131.184082 +81b55edd-b648-4967-aefd-4559416e5ca0,zai-org/GLM-4.5-Air-FP8,together_ai,build-cython-ext,6679,2432,9111,902.36444,False,0.0,zai-org/GLM-4.5-Air-FP8,build-cython-ext,902.36444,False,0.0,False,902.36444 +5b0725c5-1ab5-4b5d-a00f-150016e2fcdb,OpenAI/gpt-oss-20B,together_ai,constraints-scheduling,231,650,881,206.900755,False,0.0,OpenAI/gpt-oss-20B,constraints-scheduling,206.900755,False,0.2,False,206.900755 +502c635d-4bef-4b74-b097-662d75cd3bcb,grok-4-0709,xai,tune-mjcf,4892,5249,10141,903.215264,False,0.0,grok-4-0709,tune-mjcf,903.215264,False,0.0,False,903.215264 +ee0e0171-41f4-4a7b-bdab-d19d1cb6fd0b,gpt-5-nano,openai,form-filling,24500,29745,54245,900.243668,True,1.0,gpt-5-nano,form-filling,900.243668,True,0.6,True,900.243668 +55b56911-006c-4204-8ee1-ebb73044ccca,zai-org/GLM-4.5-Air-FP8,together_ai,run-pdp11-code,1312,1599,2911,46.218415,False,0.0,zai-org/GLM-4.5-Air-FP8,run-pdp11-code,46.218415,False,0.0,False,46.218415 
+2afa9d84-5233-462a-b757-858c82a1db65,grok-4-0709,xai,extract-elf,1588,980,2568,384.71568,True,1.0,grok-4-0709,extract-elf,384.71568,True,0.2,True,384.71568 +6b942f33-a4d6-43c2-a4fd-4c43aa0a3f2f,deepseek-ai/DeepSeek-V3.1,together_ai,log-summary-date-ranges,9006,3037,12043,296.870361,True,1.0,deepseek-ai/DeepSeek-V3.1,log-summary-date-ranges,296.870361,True,0.4,True,296.870361 +87411c9e-fe61-4e2a-b3a6-bf00a76f97de,gpt-5-mini,openai,mteb-leaderboard,2739,4132,6871,271.216223,False,0.0,gpt-5-mini,mteb-leaderboard,271.216223,False,0.0,False,271.216223 +3b395af5-5331-46a1-a1ff-12a74bf2941e,gpt-5-nano,openai,sqlite-db-truncate,3941,4473,8414,308.390938,False,0.0,gpt-5-nano,sqlite-db-truncate,308.390938,False,0.0,False,308.390938 +7b3ba137-5dfd-4b78-ac8a-e1147a2b7ccf,zai-org/GLM-4.5-Air-FP8,together_ai,openssl-selfsigned-cert,2327,2465,4792,58.879297,False,0.0,zai-org/GLM-4.5-Air-FP8,openssl-selfsigned-cert,58.879297,False,0.0,False,58.879297 +6f998f7a-7b71-41f9-ae98-cce082d8cd38,claude-opus-4-1-20250805,anthropic,model-extraction-relu-logits,6278,5535,11813,266.633976,False,0.0,claude-opus-4-1-20250805,model-extraction-relu-logits,266.633976,False,0.0,False,266.633976 +6bc7e090-9c8e-45ad-a37e-b4087fa84c5a,zai-org/GLM-4.5-Air-FP8,together_ai,chess-best-move,11502,8662,20164,815.436121,False,0.0,zai-org/GLM-4.5-Air-FP8,chess-best-move,815.436121,False,0.0,False,815.436121 +05bbbced-8720-43a2-adef-4c5b1a365b3f,moonshotai/Kimi-K2-Instruct-0905,together_ai,bn-fit-modify,16588,7381,23969,498.761609,False,0.0,moonshotai/Kimi-K2-Instruct-0905,bn-fit-modify,498.761609,False,0.0,False,498.761609 +0ef2c5d7-e28b-4c55-8649-5935e00e81d8,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,feal-linear-cryptanalysis,3291,2039,5330,308.497992,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,feal-linear-cryptanalysis,308.497992,False,0.0,False,308.497992 
+7b2234a6-f38f-4ffb-9fe4-374651004adc,OpenAI/gpt-oss-20B,together_ai,form-filling,1149,1180,2329,187.701452,False,0.0,OpenAI/gpt-oss-20B,form-filling,187.701452,False,0.0,False,187.701452 +9b2bc8be-0cdf-408f-a68d-f2ce61857c7d,claude-sonnet-4-20250514,anthropic,tune-mjcf,11482,10796,22278,903.328349,False,0.0,claude-sonnet-4-20250514,tune-mjcf,903.328349,False,0.2,False,903.328349 +c401a030-7ffd-4c07-a2b3-d7bc3e35ff5a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,bn-fit-modify,18245,5366,23611,1059.54132,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,bn-fit-modify,1059.54132,False,0.0,False,1059.54132 +0ec63e4d-e64b-4faf-905e-11f4429ba99a,gpt-5-nano,openai,path-tracing-reverse,6352,2817,9169,197.725017,False,0.0,gpt-5-nano,path-tracing-reverse,197.725017,False,0.0,False,197.725017 +53fbbe87-b97e-4c9f-9593-ff96a1d4ad89,gemini-2.5-flash,gemini,make-mips-interpreter,22823,55492,78315,1814.779469,False,0.0,gemini-2.5-flash,make-mips-interpreter,1814.779469,False,0.0,False,1814.779469 +59f7fa95-f3be-4423-84b3-734348f6ff66,zai-org/GLM-4.5-Air-FP8,together_ai,feal-differential-cryptanalysis,1847,2112,3959,171.561258,False,0.0,zai-org/GLM-4.5-Air-FP8,feal-differential-cryptanalysis,171.561258,False,0.0,False,171.561258 +3ec0518d-d1e2-4246-9c27-c003aa02591b,zai-org/GLM-4.5-Air-FP8,together_ai,large-scale-text-editing,9340,12106,21446,1229.003979,False,0.0,zai-org/GLM-4.5-Air-FP8,large-scale-text-editing,1229.003979,False,0.0,False,1229.003979 +422efa4f-9373-49fd-8fc3-304fc208bda5,gemini-2.5-flash,gemini,count-dataset-tokens,11342,7146,18488,662.968065,False,0.0,gemini-2.5-flash,count-dataset-tokens,662.968065,False,0.0,False,662.968065 +b6726919-cf21-47fd-9940-e26eb93b98b2,claude-sonnet-4-20250514,anthropic,run-pdp11-code,5465,5827,11292,1067.624187,False,0.0,claude-sonnet-4-20250514,run-pdp11-code,1067.624187,False,0.0,False,1067.624187 
+f5f6e727-433e-47ca-9ae0-e83a5dc75a34,deepseek-ai/DeepSeek-V3.1,together_ai,train-fasttext,22393,9846,32239,1893.742171,False,0.0,deepseek-ai/DeepSeek-V3.1,train-fasttext,1893.742171,False,0.0,False,1893.742171 +42850ca1-2721-48a4-9b6b-0f8038c9dc04,gpt-5-mini,openai,hf-model-inference,2618,1983,4601,245.669061,False,0.0,gpt-5-mini,hf-model-inference,245.669061,False,0.8,False,245.669061 +4e745656-8035-44fe-b628-eca6c18b7247,deepseek-ai/DeepSeek-V3.1,together_ai,reshard-c4-data,5841,3817,9658,311.898176,False,0.0,deepseek-ai/DeepSeek-V3.1,reshard-c4-data,311.898176,False,0.0,False,311.898176 +04ae2cfa-431b-480f-b18e-eb36b67e8d92,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sqlite-with-gcov,6834,1772,8606,266.825228,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sqlite-with-gcov,266.825228,False,0.4,False,266.825228 +7d78d8a6-db09-474e-8ffa-19759b4d87d4,gpt-5-mini,openai,video-processing,3970,3577,7547,143.299369,False,0.0,gpt-5-mini,video-processing,143.299369,False,0.0,False,143.299369 +d7ad3f3c-4088-4f8b-b5dc-6f031e954c42,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,password-recovery,5791,5230,11021,924.365593,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,password-recovery,924.365593,False,0.2,False,924.365593 +0b4069cb-260e-478a-a508-01fbd6e5c766,openai/gpt-oss-120b,together_ai,pypi-server,2310,989,3299,90.523169,False,0.0,openai/gpt-oss-120b,pypi-server,90.523169,False,0.4,False,90.523169 +98b8eb3e-c817-4dc4-866b-a13c87499d34,gpt-5-nano,openai,qemu-alpine-ssh,3176,8349,11525,963.531137,False,0.0,gpt-5-nano,qemu-alpine-ssh,963.531137,False,0.0,False,963.531137 +af7efeb7-e8c7-4173-bc05-eb8656230d98,claude-opus-4-1-20250805,anthropic,tune-mjcf,9033,7751,16784,970.238686,False,0.0,claude-opus-4-1-20250805,tune-mjcf,970.238686,False,0.25,False,970.238686 
+fb27d323-5f8d-455e-adb1-98ff41cc4828,claude-sonnet-4-20250514,anthropic,db-wal-recovery,4967,6571,11538,862.900372,False,0.0,claude-sonnet-4-20250514,db-wal-recovery,862.900372,False,0.0,False,862.900372 +1da65ffb-e7a9-4ee8-8839-871df824e61a,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,pypi-server,5564,4076,9640,540.424395,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,pypi-server,540.424395,False,0.0,False,540.424395 +34f30856-3acf-421e-8f76-960f02eb687e,claude-opus-4-1-20250805,anthropic,build-pmars,12262,3337,15599,435.413576,True,1.0,claude-opus-4-1-20250805,build-pmars,435.413576,True,0.5,True,435.413576 +13f81cda-2878-447b-b986-02fe56452509,gpt-5-mini,openai,fix-git,5777,5263,11040,900.95335,False,0.0,gpt-5-mini,fix-git,900.95335,False,0.6,False,900.95335 +dd72bad8-9918-415b-a0cc-c298d137d9eb,claude-opus-4-1-20250805,anthropic,torch-tensor-parallelism,2962,2247,5209,146.856933,False,0.0,claude-opus-4-1-20250805,torch-tensor-parallelism,146.856933,False,0.0,False,146.856933 +c6abca5f-3cae-432f-a5ea-cd321f7540f6,openai/gpt-oss-120b,together_ai,pytorch-model-recovery,7308,4865,12173,306.707442,True,1.0,openai/gpt-oss-120b,pytorch-model-recovery,306.707442,True,0.4,True,306.707442 +7bc5b685-774e-4fe3-bced-e123d29063d3,gpt-5-nano,openai,build-pmars,5389,4164,9553,933.897896,False,0.0,gpt-5-nano,build-pmars,933.897896,False,0.0,False,933.897896 +5018f689-0021-4208-a8ab-6122d6ffe698,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,openssl-selfsigned-cert,2246,1928,4174,252.476998,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,openssl-selfsigned-cert,252.476998,False,0.0,False,252.476998 +59c802b1-0442-4c9e-80d7-6a433ca26c60,moonshotai/Kimi-K2-Instruct-0905,together_ai,pytorch-model-cli,6937,2930,9867,384.687979,False,0.0,moonshotai/Kimi-K2-Instruct-0905,pytorch-model-cli,384.687979,False,0.0,False,384.687979 
+afb60f89-d9f6-4894-b6b5-9f35ba9ac2d2,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,db-wal-recovery,1988,1368,3356,42.300927,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,db-wal-recovery,42.300927,False,0.0,False,42.300927 +f04ee6a2-e734-45ea-aee0-a12fc823ddc1,gpt-5,openai,prove-plus-comm,1499,886,2385,102.975392,True,1.0,gpt-5,prove-plus-comm,102.975392,True,0.8571428571428571,True,102.975392 +cdb5f530-a060-4479-acd7-63786decb16a,claude-opus-4-1-20250805,anthropic,mteb-leaderboard,2673,2369,5042,97.987328,False,0.0,claude-opus-4-1-20250805,mteb-leaderboard,97.987328,False,0.0,False,97.987328 +1a00b578-0289-44b6-ac5c-159e90734e2d,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,polyglot-rust-c,7948,8380,16328,913.178116,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,polyglot-rust-c,913.178116,False,0.0,False,913.178116 +7fd45ec5-7685-4c14-99d4-81750630eecf,grok-4-0709,xai,feal-linear-cryptanalysis,6290,4832,11122,1803.391062,False,0.0,grok-4-0709,feal-linear-cryptanalysis,1803.391062,False,0.0,False,1803.391062 +9b66bc7e-e7e5-4d0f-8331-0ce670317fc3,gemini-2.5-pro,gemini,chess-best-move,18759,6033,24792,906.223259,False,0.0,gemini-2.5-pro,chess-best-move,906.223259,False,0.0,False,906.223259 +66702491-3acb-429d-819d-7dc3b15ffc0e,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,cobol-modernization,7005,5913,12918,900.009431,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,cobol-modernization,900.009431,False,0.4,False,900.009431 +20f53b78-d932-4bdf-bd4d-ca39e6128522,gemini-2.5-pro,gemini,merge-diff-arc-agi-task,12539,2809,15348,791.547286,False,0.0,gemini-2.5-pro,merge-diff-arc-agi-task,791.547286,False,0.6,False,791.547286 +48d37d5e-21b1-4335-a68d-9240069cc0a0,claude-sonnet-4-20250514,anthropic,chess-best-move,7449,6212,13661,301.786249,False,0.0,claude-sonnet-4-20250514,chess-best-move,301.786249,False,0.0,False,301.786249 
+54a3a571-d2c5-4f78-8d03-2be7406f44e2,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,gpt2-codegolf,14488,15487,29975,910.802121,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,gpt2-codegolf,910.802121,False,0.0,False,910.802121 +5f99ceed-1b2d-4d59-95b1-1a6f66db194a,gemini-2.5-pro,gemini,sqlite-with-gcov,4826,1451,6277,431.608876,True,1.0,gemini-2.5-pro,sqlite-with-gcov,431.608876,True,0.8,True,431.608876 +7eaf2575-5a2d-44e1-bd1d-8d5ec64bf32c,OpenAI/gpt-oss-20B,together_ai,hf-model-inference,3207,850,4057,66.961364,True,1.0,OpenAI/gpt-oss-20B,hf-model-inference,66.961364,True,0.4,True,66.961364 +31d7385d-7080-46cc-a45d-b40493ab9aca,moonshotai/Kimi-K2-Instruct-0905,together_ai,polyglot-rust-c,5774,6509,12283,921.516485,False,0.0,moonshotai/Kimi-K2-Instruct-0905,polyglot-rust-c,921.516485,False,0.0,False,921.516485 +0b8e5b1b-837a-4ec5-b4f2-585390455db3,zai-org/GLM-4.5-Air-FP8,together_ai,mteb-leaderboard,23186,7404,30590,495.884827,False,0.0,zai-org/GLM-4.5-Air-FP8,mteb-leaderboard,495.884827,False,0.0,False,495.884827 +4819bfcf-4bef-42f7-817b-bc90db91591d,gpt-5-mini,openai,feal-differential-cryptanalysis,2363,1512,3875,289.31515,False,0.0,gpt-5-mini,feal-differential-cryptanalysis,289.31515,False,0.0,False,289.31515 +00f79366-76ce-4807-bbae-689c2ff19ad2,OpenAI/gpt-oss-20B,together_ai,qemu-startup,1182,1367,2549,114.005648,False,0.0,OpenAI/gpt-oss-20B,qemu-startup,114.005648,False,0.0,False,114.005648 +21b2037d-6b8c-4d01-9401-17e28f2ed86d,zai-org/GLM-4.5-Air-FP8,together_ai,extract-elf,1964,2798,4762,232.990402,False,0.0,zai-org/GLM-4.5-Air-FP8,extract-elf,232.990402,False,0.4,False,232.990402 +3e4cb9a3-00ac-4868-b084-b8f2871e4cde,gpt-5-nano,openai,configure-git-webserver,8776,2538,11314,329.591897,False,0.0,gpt-5-nano,configure-git-webserver,329.591897,False,0.2,False,329.591897 
+425b45f3-b832-4134-bd51-012e72299d4b,OpenAI/gpt-oss-20B,together_ai,qemu-alpine-ssh,1423,8569,9992,118.064231,False,0.0,OpenAI/gpt-oss-20B,qemu-alpine-ssh,118.064231,False,0.0,False,118.064231 +998d54e9-c88c-4c19-93e6-258e91576be6,claude-opus-4-1-20250805,anthropic,merge-diff-arc-agi-task,11333,4916,16249,198.706254,True,1.0,claude-opus-4-1-20250805,merge-diff-arc-agi-task,198.706254,True,0.3333333333333333,True,198.706254 +a3a35965-dc8f-4b86-ad1d-f79f00896bf8,gpt-5,openai,filter-js-from-html,3888,4948,8836,361.536895,False,0.0,gpt-5,filter-js-from-html,361.536895,False,0.0,False,361.536895 +2922d35d-5727-44ed-85b6-9d7f1833b8b5,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,make-mips-interpreter,34264,28573,62837,4841.018785,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,make-mips-interpreter,4841.018785,False,0.0,False,4841.018785 +f51d2b46-f004-41e9-8e58-d9bb4c8e4b6e,gemini-2.5-pro,gemini,build-initramfs-qemu,8615,3323,11938,900.00074,False,0.0,gemini-2.5-pro,build-initramfs-qemu,900.00074,False,0.0,False,900.00074 +3558e4b0-365e-4230-b6a7-f0a6c0ccc2ec,zai-org/GLM-4.5-Air-FP8,together_ai,run-pdp11-code,755,2276,3031,1065.2798,False,0.0,zai-org/GLM-4.5-Air-FP8,run-pdp11-code,1065.2798,False,0.0,False,1065.2798 +993cd909-95ef-481f-b644-d3c46cce1840,claude-opus-4-1-20250805,anthropic,sparql-university,6570,2430,9000,217.618223,False,0.0,claude-opus-4-1-20250805,sparql-university,217.618223,False,0.0,False,217.618223 +25083454-81a4-4057-8b40-deefef05a2c6,claude-opus-4-1-20250805,anthropic,reverse-engineering,26865,18475,45340,1895.828497,False,0.0,claude-opus-4-1-20250805,reverse-engineering,1895.828497,False,0.0,False,1895.828497 +90647da0-6851-4edf-8949-2218f4331045,claude-sonnet-4-20250514,anthropic,pypi-server,6180,3598,9778,570.69396,True,1.0,claude-sonnet-4-20250514,pypi-server,570.69396,True,0.8,True,570.69396 
+5b43a50e-c179-4749-bec9-4e61b6a09273,OpenAI/gpt-oss-20B,together_ai,build-pmars,168,1151,1319,155.506388,False,0.0,OpenAI/gpt-oss-20B,build-pmars,155.506388,False,0.0,False,155.506388 +9e7a0b84-264c-42ff-b403-90d9702e7d62,claude-opus-4-1-20250805,anthropic,circuit-fibsqrt,54056,60362,114418,3612.399691,False,0.0,claude-opus-4-1-20250805,circuit-fibsqrt,3612.399691,False,0.0,False,3612.399691 +d768fac9-7968-492f-8224-5ede70c87908,claude-opus-4-1-20250805,anthropic,constraints-scheduling,5288,3438,8726,199.218903,True,1.0,claude-opus-4-1-20250805,constraints-scheduling,199.218903,True,0.8888888888888888,True,199.218903 +da21f184-3c41-4be5-ae08-b586a61cf701,gemini-2.5-pro,gemini,sqlite-with-gcov,9420,1527,10947,263.09336,True,1.0,gemini-2.5-pro,sqlite-with-gcov,263.09336,True,0.8,True,263.09336 +625cfd07-98f0-476d-bca7-95a46f4521fe,moonshotai/Kimi-K2-Instruct-0905,together_ai,circuit-fibsqrt,15834,16259,32093,1370.503314,False,0.0,moonshotai/Kimi-K2-Instruct-0905,circuit-fibsqrt,1370.503314,False,0.0,False,1370.503314 +255d41b0-9bda-4df7-8fed-0231f3d3cbdd,grok-4-0709,xai,large-scale-text-editing,1930,1211,3141,579.085318,False,0.0,grok-4-0709,large-scale-text-editing,579.085318,False,0.4,False,579.085318 +55641752-0e34-44cf-8868-77b2a4ab1435,grok-code-fast-1,xai,torch-tensor-parallelism,1571,909,2480,53.174904,False,0.0,grok-code-fast-1,torch-tensor-parallelism,53.174904,False,0.0,False,53.174904 +78863453-ab9c-49be-96e2-1b4c3270122d,gpt-5-mini,openai,install-klee-minimal,7427,4009,11436,903.03984,False,0.0,gpt-5-mini,install-klee-minimal,903.03984,False,0.0,False,903.03984 +2d94aae1-15e3-4a1e-ba0d-0e98c96d3c94,moonshotai/Kimi-K2-Instruct-0905,together_ai,cancel-async-tasks,2519,1849,4368,289.044358,False,0.0,moonshotai/Kimi-K2-Instruct-0905,cancel-async-tasks,289.044358,False,0.6,False,289.044358 
+3b43e2b5-a1b0-4bce-b825-c1bd26347e87,gpt-5-mini,openai,adaptive-rejection-sampler,9263,15224,24487,772.160986,False,0.0,gpt-5-mini,adaptive-rejection-sampler,772.160986,False,0.4,False,772.160986 +09a4e990-4665-43ed-9ca7-88ffb38cf655,grok-4-0709,xai,wasm-pipeline,6689,2723,9412,475.233157,False,0.0,grok-4-0709,wasm-pipeline,475.233157,False,0.4,False,475.233157 +8edecf4d-e355-4abd-844f-031f1aabdbe2,gpt-5-mini,openai,sanitize-git-repo,3927,4040,7967,207.200411,False,0.0,gpt-5-mini,sanitize-git-repo,207.200411,False,0.0,False,207.200411 +b1f60041-2da9-4b86-9269-bd16f9fd9cf8,moonshotai/Kimi-K2-Instruct-0905,together_ai,cancel-async-tasks,2649,2443,5092,231.979442,True,1.0,moonshotai/Kimi-K2-Instruct-0905,cancel-async-tasks,231.979442,True,0.6,True,231.979442 +f96e7606-ded0-4ecb-801a-b7d70ff5bd4a,deepseek-ai/DeepSeek-V3.1,together_ai,fix-ocaml-gc,38866,16010,54876,1970.995101,False,0.0,deepseek-ai/DeepSeek-V3.1,fix-ocaml-gc,1970.995101,False,0.0,False,1970.995101 +8580107b-763a-48a6-9d83-973fd4fbb276,grok-4-0709,xai,build-initramfs-qemu,5611,6225,11836,900.0023,False,0.0,grok-4-0709,build-initramfs-qemu,900.0023,False,0.0,False,900.0023 +fc18deba-5397-401a-92cc-72ff6614f77c,deepseek-ai/DeepSeek-V3.1,together_ai,wasm-pipeline,8501,6410,14911,919.386683,False,0.0,deepseek-ai/DeepSeek-V3.1,wasm-pipeline,919.386683,False,0.4,False,919.386683 +ad324328-3962-49e4-9455-cdda48b9045c,claude-opus-4-1-20250805,anthropic,adaptive-rejection-sampler,8573,8358,16931,1318.187283,False,0.0,claude-opus-4-1-20250805,adaptive-rejection-sampler,1318.187283,False,0.125,False,1318.187283 +6adae00a-f6b3-4370-890b-aaf8dc8758c3,gemini-2.5-pro,gemini,extract-elf,4151,2041,6192,245.914217,False,0.0,gemini-2.5-pro,extract-elf,245.914217,False,0.0,False,245.914217 
+09d959b6-861c-440b-89b9-bc9f7ec41ba3,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,video-processing,2146,1283,3429,67.720195,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,video-processing,67.720195,False,0.0,False,67.720195 +e4dbfd22-bd05-4a4a-9dab-3b7d77445c71,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-initramfs-qemu,8548,6109,14657,874.222941,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-initramfs-qemu,874.222941,False,0.0,False,874.222941 +5007e0fb-fb40-47fb-a2e1-ac6ec308cbec,openai/gpt-oss-120b,together_ai,pytorch-model-recovery,3855,5466,9321,82.945311,False,0.0,openai/gpt-oss-120b,pytorch-model-recovery,82.945311,False,0.4,False,82.945311 +bec4d01e-0376-40c4-bb79-f792629980f0,zai-org/GLM-4.5-Air-FP8,together_ai,fix-git,7691,3465,11156,101.819031,True,1.0,zai-org/GLM-4.5-Air-FP8,fix-git,101.819031,True,0.6,True,101.819031 +64f73997-df8d-400d-8979-30263167536a,gpt-5-nano,openai,log-summary-date-ranges,7730,6433,14163,270.259882,False,0.0,gpt-5-nano,log-summary-date-ranges,270.259882,False,0.0,False,270.259882 +bf984497-d26d-4954-b0a9-af0b58c66839,openai/gpt-oss-120b,together_ai,feal-linear-cryptanalysis,14864,11280,26144,667.512408,True,1.0,openai/gpt-oss-120b,feal-linear-cryptanalysis,667.512408,True,0.4,True,667.512408 +f7eb3c92-6b46-4021-8a20-a109bb54dd22,claude-opus-4-1-20250805,anthropic,crack-7z-hash,15195,4572,19767,574.585282,True,1.0,claude-opus-4-1-20250805,crack-7z-hash,574.585282,True,0.8888888888888888,True,574.585282 +390be1f7-92b8-4ab0-80ab-550db4ffdc95,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-cython-ext,16358,5054,21412,528.82896,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-cython-ext,528.82896,False,0.0,False,528.82896 +05e82edc-e480-4112-8c51-1004cf27052f,zai-org/GLM-4.5-Air-FP8,together_ai,code-from-image,3225,7754,10979,1150.170613,False,0.0,zai-org/GLM-4.5-Air-FP8,code-from-image,1150.170613,False,0.2,False,1150.170613 
+171affe1-ba43-49da-86b0-969956d3ab68,claude-opus-4-1-20250805,anthropic,financial-document-processor,11205,3946,15151,499.256021,False,0.0,claude-opus-4-1-20250805,financial-document-processor,499.256021,False,0.0,False,499.256021 +fd26450e-0802-4612-86ef-179e5b4a258f,deepseek-ai/DeepSeek-V3.1,together_ai,qemu-startup,2162,1769,3931,1009.572981,False,0.0,deepseek-ai/DeepSeek-V3.1,qemu-startup,1009.572981,False,0.2,False,1009.572981 +8ae977fd-44c3-40be-bbec-1c14ebd4fc5e,grok-code-fast-1,xai,wasm-pipeline,5222,4342,9564,219.877135,False,0.0,grok-code-fast-1,wasm-pipeline,219.877135,False,0.2,False,219.877135 +1a6d60d2-b17d-422d-bb7b-094840bc7eea,openai/gpt-oss-120b,together_ai,extract-elf,6413,4289,10702,213.657684,True,1.0,openai/gpt-oss-120b,extract-elf,213.657684,True,0.4,True,213.657684 +7fdac6dc-eb54-4b8f-bf04-393ca58b6afd,gemini-2.5-pro,gemini,code-from-image,5850,1922,7772,196.741165,True,1.0,gemini-2.5-pro,code-from-image,196.741165,True,1.0,True,196.741165 +44db6da9-f3f8-4344-88af-74627abe5796,grok-code-fast-1,xai,make-doom-for-mips,16264,4300,20564,739.340836,False,0.0,grok-code-fast-1,make-doom-for-mips,739.340836,False,0.0,False,739.340836 +253fc76a-b10c-409c-84a9-307abcb25b2c,claude-sonnet-4-20250514,anthropic,crack-7z-hash,8968,3501,12469,454.122763,True,1.0,claude-sonnet-4-20250514,crack-7z-hash,454.122763,True,1.0,True,454.122763 +57f0d009-60f9-479e-8556-ab0ad4d2ed68,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,install-windows-3.11,5075,2790,7865,206.796109,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,install-windows-3.11,206.796109,False,0.0,False,206.796109 +088e3e03-89f2-40ec-9469-a86763ad9b58,gemini-2.5-flash,gemini,port-compressor,99216,121176,220392,3600.001766,False,0.0,gemini-2.5-flash,port-compressor,3600.001766,False,0.0,False,3600.001766 
+c1229020-7a50-449c-9bee-8a594898cfa7,claude-sonnet-4-20250514,anthropic,hf-model-inference,5175,3298,8473,957.470013,True,1.0,claude-sonnet-4-20250514,hf-model-inference,957.470013,True,0.2,True,957.470013 +2457a5ae-6abe-4ca0-95b7-09a0d1082d10,gpt-5-nano,openai,circuit-fibsqrt,5446,4890,10336,388.051787,False,0.0,gpt-5-nano,circuit-fibsqrt,388.051787,False,0.0,False,388.051787 +be58f30a-9afd-40db-b1e7-97ed9f50def6,zai-org/GLM-4.5-Air-FP8,together_ai,crack-7z-hash,18697,4696,23393,900.033434,False,0.0,zai-org/GLM-4.5-Air-FP8,crack-7z-hash,900.033434,False,0.0,False,900.033434 +327bde72-5b7b-4893-969e-35afdda9ad37,gpt-5-nano,openai,break-filter-js-from-html,9837,12135,21972,1200.074658,False,0.0,gpt-5-nano,break-filter-js-from-html,1200.074658,False,0.0,False,1200.074658 +c0eedf95-ceef-4ea6-bffd-d425cc841585,claude-sonnet-4-20250514,anthropic,form-filling,6940,4842,11782,277.06691,True,1.0,claude-sonnet-4-20250514,form-filling,277.06691,True,1.0,True,277.06691 +fec88f33-335d-4ec8-b8a4-230bb16670f1,zai-org/GLM-4.5-Air-FP8,together_ai,pytorch-model-recovery,22687,15609,38296,462.700587,False,0.0,zai-org/GLM-4.5-Air-FP8,pytorch-model-recovery,462.700587,False,0.4,False,462.700587 +7bfe3c5b-0efa-4113-a9de-8eb82f1bd119,gpt-5-mini,openai,tune-mjcf,15553,8067,23620,900.151864,False,0.0,gpt-5-mini,tune-mjcf,900.151864,False,0.0,False,900.151864 +e7ca6a41-bd23-43cc-85ad-03017aed676a,moonshotai/Kimi-K2-Instruct-0905,together_ai,extract-elf,6385,1532,7917,900.000923,True,1.0,moonshotai/Kimi-K2-Instruct-0905,extract-elf,900.000923,True,0.6,True,900.000923 +272dd981-598a-4cec-a6ea-1e1aa5003c26,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sqlite-with-gcov,3342,1089,4431,466.470159,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sqlite-with-gcov,466.470159,True,0.4,True,466.470159 +b3e08346-d525-426c-b963-e1bf69c9a8f3,gpt-5-mini,openai,build-cython-ext,6541,4600,11141,910.923358,False,0.0,gpt-5-mini,build-cython-ext,910.923358,False,0.2,False,910.923358 
+39a144f0-d030-4241-92e0-34e1aa0742b8,OpenAI/gpt-oss-20B,together_ai,break-filter-js-from-html,1104,1974,3078,91.90294,False,0.0,OpenAI/gpt-oss-20B,break-filter-js-from-html,91.90294,False,0.0,False,91.90294 +93830b35-6659-4631-9344-df06c2c6138c,gpt-5-mini,openai,write-compressor,10008,8656,18664,902.392981,False,0.0,gpt-5-mini,write-compressor,902.392981,False,0.0,False,902.392981 +110deeae-2808-416a-8065-00b657deab8f,grok-4-0709,xai,extract-elf,971,2291,3262,529.264059,False,0.0,grok-4-0709,extract-elf,529.264059,False,0.2,False,529.264059 +6589165f-d71c-41ff-b139-ea158ac4eb47,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,fix-code-vulnerability,32802,6633,39435,900.882931,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,fix-code-vulnerability,900.882931,False,0.0,False,900.882931 +7b1d24c4-36ab-4ab0-ad25-19af08413b90,grok-4-0709,xai,path-tracing-reverse,3525,5954,9479,1816.671305,False,0.0,grok-4-0709,path-tracing-reverse,1816.671305,False,0.0,False,1816.671305 +8b44e4fd-0af6-4b87-9907-6af662d9231b,claude-sonnet-4-20250514,anthropic,reshard-c4-data,8668,6544,15212,900.587631,False,0.0,claude-sonnet-4-20250514,reshard-c4-data,900.587631,False,0.0,False,900.587631 +2cd7ee00-e4e0-4b9b-93fb-a0a0927d830e,gemini-2.5-pro,gemini,openssl-selfsigned-cert,2621,1933,4554,145.991291,True,1.0,gemini-2.5-pro,openssl-selfsigned-cert,145.991291,True,0.6,True,145.991291 +5e096801-1e42-4c90-9da0-8e37ad48c35a,openai/gpt-oss-120b,together_ai,sqlite-db-truncate,3374,2827,6201,321.21476,False,0.0,openai/gpt-oss-120b,sqlite-db-truncate,321.21476,False,0.0,False,321.21476 +5a72c8fa-0b3d-49ea-a9e3-945ac438d359,grok-code-fast-1,xai,pytorch-model-recovery,17195,11110,28305,751.082771,True,1.0,grok-code-fast-1,pytorch-model-recovery,751.082771,True,0.8,True,751.082771 +5002fde0-a647-43d4-b942-0f9c6e1dc5ca,OpenAI/gpt-oss-20B,together_ai,db-wal-recovery,1026,1301,2327,68.550202,False,0.0,OpenAI/gpt-oss-20B,db-wal-recovery,68.550202,False,0.0,False,68.550202 
+871eadef-c259-4879-9160-9b893e0a0907,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,winning-avg-corewars,8605,5099,13704,585.866595,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,winning-avg-corewars,585.866595,False,0.0,False,585.866595 +a4975c59-a39c-42b0-a418-6de0ad4647ab,deepseek-ai/DeepSeek-V3.1,together_ai,winning-avg-corewars,15261,16614,31875,1357.0253,False,0.0,deepseek-ai/DeepSeek-V3.1,winning-avg-corewars,1357.0253,False,0.0,False,1357.0253 +cab7fb13-e843-4940-b200-1a2265760aac,grok-4-0709,xai,path-tracing-reverse,5027,4786,9813,1807.948347,False,0.0,grok-4-0709,path-tracing-reverse,1807.948347,False,0.0,False,1807.948347 +614a8383-5b89-412d-8883-8f8ec2b340ed,gemini-2.5-flash,gemini,form-filling,17870,18949,36819,903.93215,False,0.0,gemini-2.5-flash,form-filling,903.93215,False,0.0,False,903.93215 +32f14803-ec52-440f-8a12-0cad8c9760ea,OpenAI/gpt-oss-20B,together_ai,build-cython-ext,2425,807,3232,68.01344,False,0.0,OpenAI/gpt-oss-20B,build-cython-ext,68.01344,False,0.0,False,68.01344 +8e09137e-fff0-4cf0-aec0-9f4d90e08748,grok-code-fast-1,xai,feal-linear-cryptanalysis,9319,6534,15853,900.854049,False,0.0,grok-code-fast-1,feal-linear-cryptanalysis,900.854049,False,0.0,False,900.854049 +9d63fab6-6b80-436d-b21b-93131dc19855,moonshotai/Kimi-K2-Instruct-0905,together_ai,openssl-selfsigned-cert,4411,3408,7819,218.3977,False,0.0,moonshotai/Kimi-K2-Instruct-0905,openssl-selfsigned-cert,218.3977,False,0.6,False,218.3977 +24daaac1-2943-4906-b792-3e7994ffc378,gemini-2.5-flash,gemini,cancel-async-tasks,1785,1182,2967,300.163772,False,0.0,gemini-2.5-flash,cancel-async-tasks,300.163772,False,0.2,False,300.163772 +d95b0ca4-5134-4a1e-b994-44f7f3fabcb1,claude-opus-4-1-20250805,anthropic,make-mips-interpreter,64402,53986,118388,1800.000866,False,0.0,claude-opus-4-1-20250805,make-mips-interpreter,1800.000866,False,0.0,False,1800.000866 
+f8432166-343e-4898-b4f1-ba88e47b7de4,deepseek-ai/DeepSeek-V3.1,together_ai,sanitize-git-repo,5150,1311,6461,1139.911479,False,0.0,deepseek-ai/DeepSeek-V3.1,sanitize-git-repo,1139.911479,False,0.0,False,1139.911479 +54795e28-9d40-49a7-b026-4e457999adf4,gpt-5-nano,openai,break-filter-js-from-html,8422,9742,18164,1213.599301,False,0.0,gpt-5-nano,break-filter-js-from-html,1213.599301,False,0.0,False,1213.599301 +1f3e5db6-b627-4ace-bd70-be90a2aa6c3d,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,largest-eigenval,12840,5405,18245,585.776452,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,largest-eigenval,585.776452,False,0.0,False,585.776452 +146d3748-d33a-4eaf-a03c-be1b9a411226,openai/gpt-oss-120b,together_ai,count-dataset-tokens,2182,2295,4477,386.720148,False,0.0,openai/gpt-oss-120b,count-dataset-tokens,386.720148,False,0.0,False,386.720148 +4363c7e4-bd6d-45a0-8ebe-0dd794754420,claude-sonnet-4-20250514,anthropic,sqlite-db-truncate,4796,3714,8510,426.912206,False,0.0,claude-sonnet-4-20250514,sqlite-db-truncate,426.912206,False,0.0,False,426.912206 +efdc5c20-1718-47b6-a2b0-32fb91316324,OpenAI/gpt-oss-20B,together_ai,log-summary-date-ranges,566,857,1423,100.720318,False,0.0,OpenAI/gpt-oss-20B,log-summary-date-ranges,100.720318,False,0.0,False,100.720318 +c9a872d7-0547-42ee-ad4c-6844c69dfc4c,OpenAI/gpt-oss-20B,together_ai,configure-git-webserver,4617,1755,6372,254.30957,True,1.0,OpenAI/gpt-oss-20B,configure-git-webserver,254.30957,True,0.2,True,254.30957 +6cd7b1d2-35af-4397-8206-89be66f54870,claude-opus-4-1-20250805,anthropic,sparql-university,5993,2606,8599,339.613775,False,0.0,claude-opus-4-1-20250805,sparql-university,339.613775,False,0.0,False,339.613775 +ae175cae-b553-44fe-9ff9-66df2149cce6,openai/gpt-oss-120b,together_ai,make-mips-interpreter,13875,18140,32015,1800.490537,False,0.0,openai/gpt-oss-120b,make-mips-interpreter,1800.490537,False,0.0,False,1800.490537 
+80a0e56c-96ba-4eb9-b8f5-6c48ea4814bc,gpt-5,openai,fix-git,3930,1563,5493,110.055566,True,1.0,gpt-5,fix-git,110.055566,True,1.0,True,110.055566 +06a5b16c-5f7c-4c70-88b4-f0f359cad74f,gpt-5-nano,openai,largest-eigenval,6491,5846,12337,364.138481,False,0.0,gpt-5-nano,largest-eigenval,364.138481,False,0.0,False,364.138481 +06447302-968f-42dd-be7d-d3cbbd38f453,grok-code-fast-1,xai,torch-tensor-parallelism,1758,1124,2882,12.953862,False,0.0,grok-code-fast-1,torch-tensor-parallelism,12.953862,False,0.0,False,12.953862 +4e2e041a-ab53-4e39-8033-020674a4e5de,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,wasm-pipeline,4777,1177,5954,138.191678,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,wasm-pipeline,138.191678,False,0.0,False,138.191678 +c1972cc1-8185-4a4f-bd8b-0bb2dca36c8a,deepseek-ai/DeepSeek-V3.1,together_ai,install-klee-minimal,16186,2304,18490,900.050293,False,0.0,deepseek-ai/DeepSeek-V3.1,install-klee-minimal,900.050293,False,0.0,False,900.050293 +e32b8814-b4e0-4773-8baf-cad93412979b,grok-code-fast-1,xai,adaptive-rejection-sampler,5004,3677,8681,310.526187,False,0.0,grok-code-fast-1,adaptive-rejection-sampler,310.526187,False,0.0,False,310.526187 +d4a79710-cd0f-48dd-8310-b669e97563dc,gemini-2.5-pro,gemini,tune-mjcf,6783,6184,12967,670.397557,True,1.0,gemini-2.5-pro,tune-mjcf,670.397557,True,0.2,True,670.397557 +62ca9656-d6a6-4bfd-a12a-b09a325c9447,zai-org/GLM-4.5-Air-FP8,together_ai,path-tracing-reverse,22042,8592,30634,1104.712887,False,0.0,zai-org/GLM-4.5-Air-FP8,path-tracing-reverse,1104.712887,False,0.0,False,1104.712887 +a22b5c78-9c16-47cb-a16c-e934b5b17471,grok-4-0709,xai,adaptive-rejection-sampler,7268,3381,10649,661.345924,False,0.0,grok-4-0709,adaptive-rejection-sampler,661.345924,False,0.0,False,661.345924 +036e9923-884f-4dab-82bb-b9d46375bee3,gemini-2.5-flash,gemini,fix-code-vulnerability,14250,8700,22950,900.15045,False,0.0,gemini-2.5-flash,fix-code-vulnerability,900.15045,False,0.0,False,900.15045 
+ed1466f2-e283-4eec-8d61-dac66e7afbba,grok-4-0709,xai,cobol-modernization,3342,1402,4744,616.530559,False,0.0,grok-4-0709,cobol-modernization,616.530559,False,0.2,False,616.530559 +bcddc2e8-f2d5-4d57-a543-d4c133c811e5,gemini-2.5-flash,gemini,extract-elf,5250,4292,9542,636.028645,True,1.0,gemini-2.5-flash,extract-elf,636.028645,True,0.4,True,636.028645 +394fe1f8-c289-4c5c-b07e-a7169c09b8d0,OpenAI/gpt-oss-20B,together_ai,dna-assembly,2761,5357,8118,328.308152,False,0.0,OpenAI/gpt-oss-20B,dna-assembly,328.308152,False,0.0,False,328.308152 +3fb3b8e3-1895-4e47-af1a-923e770ef1ff,gemini-2.5-flash,gemini,pytorch-model-cli,4436,2032,6468,207.06433,False,0.0,gemini-2.5-flash,pytorch-model-cli,207.06433,False,0.0,False,207.06433 +b2d61631-fc6e-4445-a924-ccaee1f73275,grok-4-0709,xai,git-leak-recovery,1540,1867,3407,902.611469,False,0.0,grok-4-0709,git-leak-recovery,902.611469,False,0.4,False,902.611469 +74b9173e-a84f-4d54-a457-3f778769eb98,deepseek-ai/DeepSeek-V3.1,together_ai,hf-model-inference,7032,1950,8982,152.424247,True,1.0,deepseek-ai/DeepSeek-V3.1,hf-model-inference,152.424247,True,0.8,True,152.424247 +0515143d-404b-466a-a207-0a670edd5207,gpt-5,openai,cobol-modernization,8483,5031,13514,320.6472,True,1.0,gpt-5,cobol-modernization,320.6472,True,1.0,True,320.6472 +e5db8d0b-3435-4784-bcab-a68bac2c70f7,claude-opus-4-1-20250805,anthropic,git-leak-recovery,2751,1678,4429,147.709571,True,1.0,claude-opus-4-1-20250805,git-leak-recovery,147.709571,True,1.0,True,147.709571 +29eb6cff-0a4a-47bf-8ed8-535972a06a4c,openai/gpt-oss-120b,together_ai,constraints-scheduling,4054,5286,9340,297.344998,True,1.0,openai/gpt-oss-120b,constraints-scheduling,297.344998,True,1.0,True,297.344998 +ff39606e-04a5-4885-8ff8-e1b53c5a91c4,gpt-5-nano,openai,build-pmars,20920,8212,29132,936.566649,False,0.0,gpt-5-nano,build-pmars,936.566649,False,0.0,False,936.566649 
+a6f6e521-c229-467b-a291-fa4c6b624b75,openai/gpt-oss-120b,together_ai,pypi-server,2713,1374,4087,252.89447,False,0.0,openai/gpt-oss-120b,pypi-server,252.89447,False,0.4,False,252.89447 +8f93f8dd-bda1-43da-90bb-3e34a4ced6a1,deepseek-ai/DeepSeek-V3.1,together_ai,feal-linear-cryptanalysis,24947,26087,51034,1810.565133,False,0.0,deepseek-ai/DeepSeek-V3.1,feal-linear-cryptanalysis,1810.565133,False,0.0,False,1810.565133 +5b5025f3-37f8-4a2f-8f12-2d6d0254cd8c,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,dna-assembly,17738,8627,26365,738.789818,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,dna-assembly,738.789818,False,0.0,False,738.789818 +d3738041-2571-4869-8f9b-d0c6b483f30e,grok-code-fast-1,xai,fix-git,2637,1812,4449,369.801683,False,0.0,grok-code-fast-1,fix-git,369.801683,False,0.2,False,369.801683 +d134c23e-d8aa-40ce-a71e-13709434bdb9,deepseek-ai/DeepSeek-V3.1,together_ai,model-extraction-relu-logits,3298,3008,6306,1025.870373,False,0.0,deepseek-ai/DeepSeek-V3.1,model-extraction-relu-logits,1025.870373,False,0.2,False,1025.870373 +09719bbf-1866-4560-bf4c-d6831caba628,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,schemelike-metacircular-eval,4518,2198,6716,110.246145,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,schemelike-metacircular-eval,110.246145,False,0.0,False,110.246145 +2aba641d-7392-4150-a147-6d3889b8ffed,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,polyglot-rust-c,11986,11192,23178,900.098759,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,polyglot-rust-c,900.098759,False,0.0,False,900.098759 +41f13e8c-1b7a-4684-96a4-fbd14fdadeac,claude-opus-4-1-20250805,anthropic,fix-ocaml-gc,46581,27111,73692,3600.001989,False,0.0,claude-opus-4-1-20250805,fix-ocaml-gc,3600.001989,False,0.5,False,3600.001989 +28130f67-13a6-4840-a741-7d55d0380cbc,openai/gpt-oss-120b,together_ai,qemu-startup,1168,747,1915,104.046084,False,0.0,openai/gpt-oss-120b,qemu-startup,104.046084,False,0.0,False,104.046084 
+db558e6c-919d-433d-914b-b8d32d8196d6,deepseek-ai/DeepSeek-V3.1,together_ai,make-doom-for-mips,18825,4438,23263,900.002539,False,0.0,deepseek-ai/DeepSeek-V3.1,make-doom-for-mips,900.002539,False,0.0,False,900.002539 +5a08ef44-1b42-44b2-9afd-3898bf4773a0,openai/gpt-oss-120b,together_ai,bn-fit-modify,2620,1890,4510,208.541532,False,0.0,openai/gpt-oss-120b,bn-fit-modify,208.541532,False,0.2,False,208.541532 +b9509375-fdf5-4f21-b8ce-6fcf3c767742,claude-opus-4-1-20250805,anthropic,winning-avg-corewars,18719,16566,35285,4698.226795,False,0.0,claude-opus-4-1-20250805,winning-avg-corewars,4698.226795,False,0.3333333333333333,False,4698.226795 +e3dfe3ec-e6c4-417b-8433-bfc9ab471995,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,count-dataset-tokens,14712,4992,19704,900.323936,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,count-dataset-tokens,900.323936,False,0.0,False,900.323936 +09daf0a3-0be2-4108-84ba-73ed4c8b262e,grok-code-fast-1,xai,form-filling,7116,4328,11444,326.551391,True,1.0,grok-code-fast-1,form-filling,326.551391,True,0.6,True,326.551391 +0a5b4755-e74a-4188-aa96-99d5d7e47808,deepseek-ai/DeepSeek-V3.1,together_ai,build-pmars,9938,2289,12227,252.559786,True,1.0,deepseek-ai/DeepSeek-V3.1,build-pmars,252.559786,True,1.0,True,252.559786 +ef888d92-2b9a-4917-baae-981f37e6f903,gemini-2.5-pro,gemini,schemelike-metacircular-eval,14347,14305,28652,947.104285,False,0.0,gemini-2.5-pro,schemelike-metacircular-eval,947.104285,False,0.0,False,947.104285 +d8586f46-ff91-4510-8d7e-290639b1cccd,openai/gpt-oss-120b,together_ai,nginx-request-logging,3357,1412,4769,136.52262,False,0.0,openai/gpt-oss-120b,nginx-request-logging,136.52262,False,0.4,False,136.52262 +5334ce1c-e444-440d-91b1-dad213c1a1f9,moonshotai/Kimi-K2-Instruct-0905,together_ai,pytorch-model-recovery,13642,13243,26885,914.338319,False,0.0,moonshotai/Kimi-K2-Instruct-0905,pytorch-model-recovery,914.338319,False,0.4,False,914.338319 
+8c4b3e68-ae5f-449f-8144-73be29b7ab11,OpenAI/gpt-oss-20B,together_ai,code-from-image,159,451,610,89.516199,False,0.0,OpenAI/gpt-oss-20B,code-from-image,89.516199,False,0.0,False,89.516199 +00aaeee6-eb73-4c06-a1a5-5290f6acb3d7,claude-opus-4-1-20250805,anthropic,log-summary-date-ranges,7720,1855,9575,295.41452,True,1.0,claude-opus-4-1-20250805,log-summary-date-ranges,295.41452,True,0.8888888888888888,True,295.41452 +2e4bd1d6-0972-4a93-af96-d663469d7e56,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,regex-log,1183,724,1907,68.106004,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,regex-log,68.106004,False,0.0,False,68.106004 +2a842935-93e1-492f-bb3e-df9771f260a5,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,fix-ocaml-gc,28942,15688,44630,3606.099714,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,fix-ocaml-gc,3606.099714,False,0.0,False,3606.099714 +78ef4ba7-9fd2-44ee-9005-86543b3934b4,grok-code-fast-1,xai,schemelike-metacircular-eval,11101,7673,18774,414.705353,False,0.0,grok-code-fast-1,schemelike-metacircular-eval,414.705353,False,0.0,False,414.705353 +3e0b43ee-d1db-4a8c-9ac2-e4e15da730cb,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,pytorch-model-cli,11275,5602,16877,900.338713,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,pytorch-model-cli,900.338713,False,0.0,False,900.338713 +6cb366ea-282c-4b5b-a7e0-b0df094dab48,gemini-2.5-flash,gemini,merge-diff-arc-agi-task,12628,20352,32980,908.598271,False,0.0,gemini-2.5-flash,merge-diff-arc-agi-task,908.598271,False,0.0,False,908.598271 +12e96ba6-7a79-49b8-b4ce-d963f3473624,gpt-5-nano,openai,build-cython-ext,9547,5979,15526,922.466644,False,0.0,gpt-5-nano,build-cython-ext,922.466644,False,0.0,False,922.466644 +c052e71f-e15e-4d9c-bb70-4ff3600eca4e,gpt-5,openai,chess-best-move,19462,7302,26764,900.000906,False,0.0,gpt-5,chess-best-move,900.000906,False,0.0,False,900.000906 
+6c9ffc91-df45-42ea-a4e2-a148e8d02358,OpenAI/gpt-oss-20B,together_ai,mteb-retrieve,1921,740,2661,59.895487,False,0.0,OpenAI/gpt-oss-20B,mteb-retrieve,59.895487,False,0.0,False,59.895487 +f11df8b3-737e-4ccf-b4a5-ef18c483681e,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,pytorch-model-cli,8080,8162,16242,494.687185,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,pytorch-model-cli,494.687185,False,0.0,False,494.687185 +114342a0-333b-4ddc-a403-81fa9e632de9,moonshotai/Kimi-K2-Instruct-0905,together_ai,make-mips-interpreter,26631,20276,46907,1840.534871,False,0.0,moonshotai/Kimi-K2-Instruct-0905,make-mips-interpreter,1840.534871,False,0.0,False,1840.534871 +6c00e278-fa95-4adc-ace8-273951085a72,gpt-5,openai,circuit-fibsqrt,14465,7823,22288,1002.388623,True,1.0,gpt-5,circuit-fibsqrt,1002.388623,True,0.6666666666666666,True,1002.388623 +d2987b53-5eb3-489c-860e-497852477770,OpenAI/gpt-oss-20B,together_ai,make-mips-interpreter,5989,25863,31852,1816.206139,False,0.0,OpenAI/gpt-oss-20B,make-mips-interpreter,1816.206139,False,0.0,False,1816.206139 +224c96a0-dd65-4d8f-84f7-d51266b16515,openai/gpt-oss-120b,together_ai,install-windows-3.11,4746,927,5673,68.857492,False,0.0,openai/gpt-oss-120b,install-windows-3.11,68.857492,False,0.0,False,68.857492 +3c148fd0-5f94-4e67-800d-ca9c66f6f0ed,gpt-5-mini,openai,dna-assembly,8665,8200,16865,720.089836,False,0.0,gpt-5-mini,dna-assembly,720.089836,False,0.0,False,720.089836 +1a8e28c9-d2e7-41aa-af05-1fe5c1c4b4f1,gemini-2.5-pro,gemini,large-scale-text-editing,3813,4195,8008,1245.536666,False,0.0,gemini-2.5-pro,large-scale-text-editing,1245.536666,False,0.4,False,1245.536666 +4f7938f8-d277-433b-9663-96df7fc2f290,openai/gpt-oss-120b,together_ai,sparql-university,1564,801,2365,91.231956,False,0.0,openai/gpt-oss-120b,sparql-university,91.231956,False,0.0,False,91.231956 
+70120133-6e23-4b6f-9b31-77872a76daf9,gemini-2.5-pro,gemini,cancel-async-tasks,1228,984,2212,391.023943,False,0.0,gemini-2.5-pro,cancel-async-tasks,391.023943,False,0.0,False,391.023943 +0abb0c24-8bb1-4527-ad5a-49d17b2c644d,gpt-5-nano,openai,db-wal-recovery,3078,3068,6146,205.118138,False,0.0,gpt-5-nano,db-wal-recovery,205.118138,False,0.0,False,205.118138 +305db620-a680-43c3-a20f-77999cd2a3fc,gemini-2.5-pro,gemini,pytorch-model-cli,15853,4560,20413,768.194992,True,1.0,gemini-2.5-pro,pytorch-model-cli,768.194992,True,0.4,True,768.194992 +5fc4268a-d7fe-45d6-b59f-9cc28513dfc8,gpt-5,openai,feal-linear-cryptanalysis,9764,4777,14541,345.592296,True,1.0,gpt-5,feal-linear-cryptanalysis,345.592296,True,1.0,True,345.592296 +a70f0bc6-fbba-4caf-beb7-a10780391adb,grok-code-fast-1,xai,torch-tensor-parallelism,1594,982,2576,48.794551,False,0.0,grok-code-fast-1,torch-tensor-parallelism,48.794551,False,0.0,False,48.794551 +4f2f0d63-d419-432b-9d84-44b199b2f309,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,install-klee-minimal,15974,2389,18363,900.468381,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,install-klee-minimal,900.468381,False,0.0,False,900.468381 +62c9f64c-22ce-423a-925c-9427a28367a3,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,wasm-pipeline,24572,6469,31041,912.009142,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,wasm-pipeline,912.009142,False,0.6,False,912.009142 +4bba3d44-015c-4200-b85a-ab3e5c8aed1d,OpenAI/gpt-oss-20B,together_ai,bn-fit-modify,3574,20245,23819,1900.158172,False,0.0,OpenAI/gpt-oss-20B,bn-fit-modify,1900.158172,False,0.0,False,1900.158172 +5efd346c-fef8-45e6-ba8e-158bf0485231,claude-sonnet-4-20250514,anthropic,gpt2-codegolf,15734,9325,25059,900.264474,False,0.0,claude-sonnet-4-20250514,gpt2-codegolf,900.264474,False,0.0,False,900.264474 
+f43ee00a-b8bd-4ea9-b25a-8fb9de2d7838,moonshotai/Kimi-K2-Instruct-0905,together_ai,sparql-university,2804,1191,3995,906.094128,False,0.0,moonshotai/Kimi-K2-Instruct-0905,sparql-university,906.094128,False,0.0,False,906.094128 +a503c32b-3e8a-4d0f-9b42-dd7690124e76,gpt-5-nano,openai,sqlite-with-gcov,5365,1759,7124,276.664172,True,1.0,gpt-5-nano,sqlite-with-gcov,276.664172,True,0.6,True,276.664172 +dfd2e2db-cb2d-49cb-8c1e-5679d9ac78d2,claude-opus-4-1-20250805,anthropic,hf-model-inference,7101,3438,10539,442.837949,True,1.0,claude-opus-4-1-20250805,hf-model-inference,442.837949,True,0.25,True,442.837949 +e720d6d4-daa6-4ccd-8deb-1db209933c69,zai-org/GLM-4.5-Air-FP8,together_ai,port-compressor,51484,29478,80962,3619.290197,False,0.0,zai-org/GLM-4.5-Air-FP8,port-compressor,3619.290197,False,0.0,False,3619.290197 +b7a8dd81-2bf7-4193-b386-25cac1ee1d96,grok-4-0709,xai,build-cython-ext,16646,6436,23082,900.3513,False,0.0,grok-4-0709,build-cython-ext,900.3513,False,0.0,False,900.3513 +2444cc8f-d451-4a1b-899a-2d3fb4229814,grok-4-0709,xai,gpt2-codegolf,917,425,1342,115.686724,False,0.0,grok-4-0709,gpt2-codegolf,115.686724,False,0.0,False,115.686724 +db70010f-83b4-4ed7-befe-bb8920099f7e,claude-opus-4-1-20250805,anthropic,make-doom-for-mips,26935,11099,38034,900.000328,False,0.0,claude-opus-4-1-20250805,make-doom-for-mips,900.000328,False,0.0,False,900.000328 +d3f18a4f-3473-4420-bd11-a8a99402db36,gpt-5-mini,openai,break-filter-js-from-html,2672,1803,4475,348.146137,False,0.0,gpt-5-mini,break-filter-js-from-html,348.146137,False,0.0,False,348.146137 +ad1bc51a-9353-48f1-9173-b94038eed24a,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,db-wal-recovery,4801,5106,9907,619.78663,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,db-wal-recovery,619.78663,False,0.0,False,619.78663 +87950f72-f3a3-4b05-8f32-a298dbd2a7b8,grok-4-0709,xai,train-fasttext,43641,13299,56940,3621.500217,False,0.0,grok-4-0709,train-fasttext,3621.500217,False,0.2,False,3621.500217 
+b87d4f01-67da-404e-a6b1-cd464ef4e8fb,gpt-5,openai,make-doom-for-mips,6623,5620,12243,900.033643,False,0.0,gpt-5,make-doom-for-mips,900.033643,False,0.0,False,900.033643 +6752cd91-6165-402d-9106-ed358112f4ab,deepseek-ai/DeepSeek-V3.1,together_ai,merge-diff-arc-agi-task,10121,2641,12762,900.059339,False,0.0,deepseek-ai/DeepSeek-V3.1,merge-diff-arc-agi-task,900.059339,False,0.2,False,900.059339 +09dc4105-c9fc-49da-8959-27c1e147259b,gpt-5-nano,openai,fix-code-vulnerability,4248,2157,6405,941.852106,False,0.0,gpt-5-nano,fix-code-vulnerability,941.852106,False,0.2,False,941.852106 +fa1b68d9-d614-45d9-8ebf-f3a21725b8d9,gpt-5-nano,openai,gpt2-codegolf,9437,9169,18606,900.768369,False,0.0,gpt-5-nano,gpt2-codegolf,900.768369,False,0.0,False,900.768369 +8cf0bd23-e9e7-44d6-b41c-a5071722d981,gpt-5,openai,tune-mjcf,7768,4164,11932,900.711382,False,0.0,gpt-5,tune-mjcf,900.711382,False,0.0,False,900.711382 +b30e7168-b15f-4fc1-ae27-dfd4ecd24dfc,OpenAI/gpt-oss-20B,together_ai,break-filter-js-from-html,1647,4828,6475,104.0089,False,0.0,OpenAI/gpt-oss-20B,break-filter-js-from-html,104.0089,False,0.0,False,104.0089 +d7b35b3c-d36e-403e-8160-f1e5d9dfc1d8,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,qemu-startup,1615,1002,2617,453.121868,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,qemu-startup,453.121868,True,0.4,True,453.121868 +701cfce1-6a2c-4cc5-9905-fb5bd12c66d2,moonshotai/Kimi-K2-Instruct-0905,together_ai,git-leak-recovery,2715,3085,5800,268.991108,True,1.0,moonshotai/Kimi-K2-Instruct-0905,git-leak-recovery,268.991108,True,1.0,True,268.991108 +a32840b5-36e0-4886-8b60-2037a03aa1c8,gpt-5-nano,openai,polyglot-rust-c,6693,9416,16109,905.077738,False,0.0,gpt-5-nano,polyglot-rust-c,905.077738,False,0.0,False,905.077738 +f74ef816-d76c-414c-aea2-2164d75f612b,claude-opus-4-1-20250805,anthropic,build-pov-ray,15123,4310,19433,872.578565,True,1.0,claude-opus-4-1-20250805,build-pov-ray,872.578565,True,0.75,True,872.578565 
+ec929e5c-ba62-482e-b0aa-3f85ba5bb945,openai/gpt-oss-120b,together_ai,tune-mjcf,6952,7447,14399,926.456411,False,0.0,openai/gpt-oss-120b,tune-mjcf,926.456411,False,0.2,False,926.456411 +1706e640-86f8-4cad-b7b2-4022e2d9e903,grok-4-0709,xai,break-filter-js-from-html,1947,2164,4111,1212.536861,False,0.0,grok-4-0709,break-filter-js-from-html,1212.536861,False,0.0,False,1212.536861 +640c25ba-22d0-477f-b1d8-a60350a9941f,OpenAI/gpt-oss-20B,together_ai,tune-mjcf,5664,19849,25513,900.031734,False,0.0,OpenAI/gpt-oss-20B,tune-mjcf,900.031734,False,0.0,False,900.031734 +1186f2d0-79ef-4e0b-92a1-3f81921329d5,gemini-2.5-pro,gemini,port-compressor,35117,36134,71251,3611.956151,False,0.0,gemini-2.5-pro,port-compressor,3611.956151,False,0.0,False,3611.956151 +243c8c84-4993-4366-bc85-2760a725db0b,grok-code-fast-1,xai,qemu-startup,1578,790,2368,214.288405,False,0.0,grok-code-fast-1,qemu-startup,214.288405,False,0.0,False,214.288405 +e46ffdbd-30d7-45ed-a7e5-491ff51e0dc5,openai/gpt-oss-120b,together_ai,circuit-fibsqrt,5936,10428,16364,977.746549,False,0.0,openai/gpt-oss-120b,circuit-fibsqrt,977.746549,False,0.0,False,977.746549 +b2ad017f-adf9-4b22-b31e-2335ede5dc87,OpenAI/gpt-oss-20B,together_ai,sanitize-git-repo,971,992,1963,223.962708,False,0.0,OpenAI/gpt-oss-20B,sanitize-git-repo,223.962708,False,0.0,False,223.962708 +f7f96947-2a27-4a59-9a6d-577adb52ad40,zai-org/GLM-4.5-Air-FP8,together_ai,distribution-search,17581,16655,34236,738.994043,False,0.0,zai-org/GLM-4.5-Air-FP8,distribution-search,738.994043,False,0.0,False,738.994043 +1f2e4859-5af4-4c45-b5fc-c47a1e1d7805,gpt-5-nano,openai,port-compressor,26384,33488,59872,3611.687095,False,0.0,gpt-5-nano,port-compressor,3611.687095,False,0.0,False,3611.687095 +ffd4ac71-08c4-4de3-9c7d-359959bca4eb,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,qemu-startup,3245,3857,7102,484.467271,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,qemu-startup,484.467271,False,0.0,False,484.467271 
+5fdadff7-69a0-4d1d-b65e-3c40ff714fef,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,gpt2-codegolf,6423,5759,12182,499.48679,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,gpt2-codegolf,499.48679,False,0.0,False,499.48679 +d27e35f2-1de1-49b6-8dd3-048c9333b51e,openai/gpt-oss-120b,together_ai,train-fasttext,27377,11387,38764,3606.177206,False,0.0,openai/gpt-oss-120b,train-fasttext,3606.177206,False,0.0,False,3606.177206 +8bf3ccaf-39fc-4353-9c94-6d78f0b1b8fd,gemini-2.5-flash,gemini,regex-log,1220,1029,2249,150.324853,False,0.0,gemini-2.5-flash,regex-log,150.324853,False,0.8,False,150.324853 +8beaeca1-7396-4022-b39f-d2d0b04fd2a9,zai-org/GLM-4.5-Air-FP8,together_ai,path-tracing-reverse,12256,6873,19129,462.020406,False,0.0,zai-org/GLM-4.5-Air-FP8,path-tracing-reverse,462.020406,False,0.0,False,462.020406 +97ec64aa-2fcb-4bb7-953e-23a611902e4b,gpt-5-nano,openai,polyglot-c-py,5966,7242,13208,900.141671,False,0.0,gpt-5-nano,polyglot-c-py,900.141671,False,0.0,False,900.141671 +bfaa828b-aea2-4736-887b-bc7a3b9e3710,grok-4-0709,xai,fix-git,2005,1656,3661,572.73406,True,1.0,grok-4-0709,fix-git,572.73406,True,1.0,True,572.73406 +89d626cc-dd10-435f-84d8-5f6ce239d420,OpenAI/gpt-oss-20B,together_ai,log-summary-date-ranges,159,1999,2158,237.287327,False,0.0,OpenAI/gpt-oss-20B,log-summary-date-ranges,237.287327,False,0.0,False,237.287327 +f054b6f0-946d-4feb-8b7c-5b2d85fe5ead,moonshotai/Kimi-K2-Instruct-0905,together_ai,break-filter-js-from-html,5887,8068,13955,1223.14811,False,0.0,moonshotai/Kimi-K2-Instruct-0905,break-filter-js-from-html,1223.14811,False,0.0,False,1223.14811 +3cae6dcf-5752-485a-8f64-9504aaa65a79,claude-sonnet-4-20250514,anthropic,cobol-modernization,6451,5434,11885,900.438976,True,1.0,claude-sonnet-4-20250514,cobol-modernization,900.438976,True,1.0,True,900.438976 +c937d52b-1a16-47af-8f78-8969f2a22df9,gpt-5,openai,port-compressor,26330,42114,68444,3605.03076,False,0.0,gpt-5,port-compressor,3605.03076,False,0.0,False,3605.03076 
+020b5cc6-97bc-4df0-8135-4074a49e12e2,gemini-2.5-pro,gemini,train-fasttext,24394,9542,33936,3609.482687,False,0.0,gemini-2.5-pro,train-fasttext,3609.482687,False,0.0,False,3609.482687 +fee2e9ad-5aee-4cd4-894b-26e071c71c93,grok-code-fast-1,xai,install-klee-minimal,4097,1508,5605,479.099412,False,0.0,grok-code-fast-1,install-klee-minimal,479.099412,False,0.0,False,479.099412 +6026fc81-13ef-4c5b-a417-b19c79c72526,claude-sonnet-4-20250514,anthropic,merge-diff-arc-agi-task,17043,10411,27454,408.617625,False,0.0,claude-sonnet-4-20250514,merge-diff-arc-agi-task,408.617625,False,0.0,False,408.617625 +2e52b47e-3ccc-441b-9ca5-2a6b3d4c3b13,openai/gpt-oss-120b,together_ai,sparql-university,4288,1973,6261,135.395173,False,0.0,openai/gpt-oss-120b,sparql-university,135.395173,False,0.0,False,135.395173 +e27c1749-6550-41a1-8151-1e6ed40f2243,gpt-5,openai,install-klee-minimal,4927,2669,7596,901.908794,False,0.0,gpt-5,install-klee-minimal,901.908794,False,0.0,False,901.908794 +1a4a0c7e-5956-4477-ae6a-ae45a1b40979,gemini-2.5-pro,gemini,build-cython-ext,15628,6005,21633,789.476067,False,0.0,gemini-2.5-pro,build-cython-ext,789.476067,False,0.0,False,789.476067 +79b54340-e4c9-474d-ac59-d3058685795c,grok-code-fast-1,xai,password-recovery,1383,1019,2402,166.469868,False,0.0,grok-code-fast-1,password-recovery,166.469868,False,0.0,False,166.469868 +1162e9e5-e3f3-4df8-a004-08c575d8b652,moonshotai/Kimi-K2-Instruct-0905,together_ai,merge-diff-arc-agi-task,28614,17242,45856,904.728393,False,0.0,moonshotai/Kimi-K2-Instruct-0905,merge-diff-arc-agi-task,904.728393,False,0.0,False,904.728393 +eabfef9d-eafc-42e7-9724-16d9569da1d4,OpenAI/gpt-oss-20B,together_ai,merge-diff-arc-agi-task,1379,6027,7406,907.238202,False,0.0,OpenAI/gpt-oss-20B,merge-diff-arc-agi-task,907.238202,False,0.0,False,907.238202 
+3448513f-6dac-40e2-9bfe-6b8d08f98d2c,zai-org/GLM-4.5-Air-FP8,together_ai,distribution-search,8672,8766,17438,508.107931,False,0.0,zai-org/GLM-4.5-Air-FP8,distribution-search,508.107931,False,0.0,False,508.107931 +a8977b2d-872f-4cd9-9242-3e58c6e5e4f0,grok-4-0709,xai,fix-ocaml-gc,23068,8000,31068,2283.769183,False,0.0,grok-4-0709,fix-ocaml-gc,2283.769183,False,0.0,False,2283.769183 +dbac6eae-042d-4b33-afc6-4247d2710b99,gpt-5-mini,openai,extract-elf,2567,3341,5908,300.908164,True,1.0,gpt-5-mini,extract-elf,300.908164,True,0.6,True,300.908164 +0bd08ad3-9ba8-432e-b6f5-49acfedc5930,gpt-5-nano,openai,dna-assembly,5425,7746,13171,726.593836,False,0.0,gpt-5-nano,dna-assembly,726.593836,False,0.0,False,726.593836 +92d2235e-1fb7-46aa-8c1c-449e6cca542c,gpt-5-mini,openai,winning-avg-corewars,13084,10161,23245,3619.603306,False,0.0,gpt-5-mini,winning-avg-corewars,3619.603306,False,0.0,False,3619.603306 +bc631276-1e87-44dd-a178-5424cd80fac1,gemini-2.5-flash,gemini,path-tracing,1439,944,2383,1544.269619,False,0.0,gemini-2.5-flash,path-tracing,1544.269619,False,0.0,False,1544.269619 +395a8fdb-2b7a-48be-b3b8-859453c704cb,claude-opus-4-1-20250805,anthropic,pytorch-model-recovery,6745,3055,9800,235.176575,True,1.0,claude-opus-4-1-20250805,pytorch-model-recovery,235.176575,True,1.0,True,235.176575 +4e1fda26-3afc-4927-a098-c1b6734a5939,deepseek-ai/DeepSeek-V3.1,together_ai,distribution-search,26501,21736,48237,2101.630507,False,0.0,deepseek-ai/DeepSeek-V3.1,distribution-search,2101.630507,False,0.0,False,2101.630507 +09d503f6-3201-4e56-afbf-c7fab57aafdf,claude-sonnet-4-20250514,anthropic,tune-mjcf,9274,7828,17102,903.023557,False,0.0,claude-sonnet-4-20250514,tune-mjcf,903.023557,False,0.2,False,903.023557 +2b338aec-06df-42c4-83ca-9331c028f363,gpt-5-nano,openai,log-summary-date-ranges,15942,19429,35371,909.398653,False,0.0,gpt-5-nano,log-summary-date-ranges,909.398653,False,0.0,False,909.398653 
+e76f8a22-4753-4a60-a71e-88e90d1a56c4,gpt-5-nano,openai,pypi-server,5716,3188,8904,393.226204,True,1.0,gpt-5-nano,pypi-server,393.226204,True,0.8,True,393.226204 +d4f5757f-9a4d-46a9-ba71-47ad00e5fd46,gemini-2.5-pro,gemini,fix-git,3109,1492,4601,143.464295,True,1.0,gemini-2.5-pro,fix-git,143.464295,True,1.0,True,143.464295 +e037d264-15df-4063-90eb-a7a3e4749ac1,gpt-5,openai,largest-eigenval,5280,5010,10290,915.411873,False,0.0,gpt-5,largest-eigenval,915.411873,False,0.0,False,915.411873 +67323d2f-7b71-4ebf-9a3c-8a246dcb1522,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,write-compressor,20163,7566,27729,904.193577,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,write-compressor,904.193577,False,0.0,False,904.193577 +f3314122-cf6d-4127-a9c1-88463b8ed8dd,gpt-5-mini,openai,chess-best-move,13923,15301,29224,906.753355,False,0.0,gpt-5-mini,chess-best-move,906.753355,False,0.0,False,906.753355 +33dc4748-587a-4c9a-b29c-3d15b7a6fb1f,claude-sonnet-4-20250514,anthropic,winning-avg-corewars,17301,16591,33892,1984.640415,False,0.0,claude-sonnet-4-20250514,winning-avg-corewars,1984.640415,False,0.0,False,1984.640415 +4df69ee3-8d7e-4019-a33b-eb894ad68f4e,gpt-5-mini,openai,code-from-image,15871,9471,25342,1200.219384,False,0.0,gpt-5-mini,code-from-image,1200.219384,False,0.0,False,1200.219384 +6838a0a6-0790-41da-9d9c-f68bd8f86637,gemini-2.5-flash,gemini,port-compressor,61601,97430,159031,3601.907017,False,0.0,gemini-2.5-flash,port-compressor,3601.907017,False,0.0,False,3601.907017 +405b8434-64b0-4a90-8aa1-3cbf32cbc04e,OpenAI/gpt-oss-20B,together_ai,reverse-engineering,1974,7170,9144,2030.025354,False,0.0,OpenAI/gpt-oss-20B,reverse-engineering,2030.025354,False,0.0,False,2030.025354 +ad96c00b-803f-4e0b-b848-aef3941a9bc2,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,count-dataset-tokens,13620,4861,18481,906.8158,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,count-dataset-tokens,906.8158,False,0.0,False,906.8158 
+101a70a4-b733-4429-87c5-d1145be51387,openai/gpt-oss-120b,together_ai,openssl-selfsigned-cert,1795,1052,2847,40.525633,False,0.0,openai/gpt-oss-120b,openssl-selfsigned-cert,40.525633,False,0.8,False,40.525633 +9926281f-2c4f-4588-8fa3-aa49548459f4,deepseek-ai/DeepSeek-V3.1,together_ai,bn-fit-modify,24628,8292,32920,764.198961,False,0.0,deepseek-ai/DeepSeek-V3.1,bn-fit-modify,764.198961,False,0.0,False,764.198961 +477a1f21-5ce6-4952-b061-3257213448c0,gemini-2.5-flash,gemini,build-cython-ext,17680,6136,23816,928.748796,False,0.0,gemini-2.5-flash,build-cython-ext,928.748796,False,0.0,False,928.748796 +2f25a9ef-f508-4fdb-9826-0e0c442de532,claude-sonnet-4-20250514,anthropic,circuit-fibsqrt,38205,42323,80528,3593.166055,False,0.0,claude-sonnet-4-20250514,circuit-fibsqrt,3593.166055,False,0.0,False,3593.166055 +9f49ab87-9a5d-4f70-a52f-cd6c6584c039,openai/gpt-oss-120b,together_ai,sqlite-db-truncate,6756,4350,11106,347.02981,False,0.0,openai/gpt-oss-120b,sqlite-db-truncate,347.02981,False,0.0,False,347.02981 +eca79742-1a0f-4013-bde1-c703fd850be0,gemini-2.5-pro,gemini,port-compressor,30610,27216,57826,3600.001709,False,0.0,gemini-2.5-pro,port-compressor,3600.001709,False,0.0,False,3600.001709 +e68f4725-38ae-42b7-81e1-4f6c737e77d0,openai/gpt-oss-120b,together_ai,regex-log,1538,1094,2632,82.229762,False,0.0,openai/gpt-oss-120b,regex-log,82.229762,False,0.4,False,82.229762 +210af782-0274-40f2-8fd3-7c6e777b437e,gemini-2.5-pro,gemini,sanitize-git-repo,11460,2504,13964,948.924235,False,0.0,gemini-2.5-pro,sanitize-git-repo,948.924235,False,0.0,False,948.924235 +e1c5f95a-d825-4f41-9020-5feb24e4361a,grok-4-0709,xai,git-leak-recovery,1156,528,1684,202.910628,True,1.0,grok-4-0709,git-leak-recovery,202.910628,True,0.4,True,202.910628 +f26b6302-64ae-4827-9819-be33dfdd6614,gpt-5-mini,openai,make-doom-for-mips,3423,3195,6618,908.727245,False,0.0,gpt-5-mini,make-doom-for-mips,908.727245,False,0.0,False,908.727245 
+96d2fadb-b05e-4893-a004-f23de8259aa4,openai/gpt-oss-120b,together_ai,build-pov-ray,21237,12941,34178,5515.988431,False,0.0,openai/gpt-oss-120b,build-pov-ray,5515.988431,False,0.0,False,5515.988431 +ca3764f9-cfd5-424e-bffe-0bb6cc8809e1,gemini-2.5-flash,gemini,wasm-pipeline,10103,2947,13050,386.865551,True,1.0,gemini-2.5-flash,wasm-pipeline,386.865551,True,0.4,True,386.865551 +f13817ec-b542-4da4-9c29-8eafe1352efe,moonshotai/Kimi-K2-Instruct-0905,together_ai,mteb-retrieve,2534,1897,4431,247.564662,False,0.0,moonshotai/Kimi-K2-Instruct-0905,mteb-retrieve,247.564662,False,0.0,False,247.564662 +d2f9865a-fc4c-4150-b3f2-1e1050e37e80,claude-opus-4-1-20250805,anthropic,gpt2-codegolf,4807,5760,10567,917.690204,False,0.0,claude-opus-4-1-20250805,gpt2-codegolf,917.690204,False,0.0,False,917.690204 +59d9d525-de3e-46c8-9ac2-620e9c62bccc,openai/gpt-oss-120b,together_ai,build-pov-ray,27021,20347,47368,6000.725107,False,0.0,openai/gpt-oss-120b,build-pov-ray,6000.725107,False,0.0,False,6000.725107 +89ae7ef6-f48f-475e-845c-f25139fe011c,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,log-summary-date-ranges,4998,2627,7625,115.628928,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,log-summary-date-ranges,115.628928,False,0.0,False,115.628928 +c6c0c9c3-ceff-4a90-a4d7-afcd7cca8143,openai/gpt-oss-120b,together_ai,install-klee-minimal,1498,1658,3156,844.496042,False,0.0,openai/gpt-oss-120b,install-klee-minimal,844.496042,False,0.0,False,844.496042 +9e6d9e23-84d1-49c3-ba09-fca3d1052210,openai/gpt-oss-120b,together_ai,polyglot-c-py,4442,7889,12331,900.698217,False,0.0,openai/gpt-oss-120b,polyglot-c-py,900.698217,False,0.0,False,900.698217 +98ea32dd-cd49-49ab-a20f-77aea9e90139,claude-opus-4-1-20250805,anthropic,filter-js-from-html,6750,8584,15334,199.584844,False,0.0,claude-opus-4-1-20250805,filter-js-from-html,199.584844,False,0.0,False,199.584844 
+2a759ffd-5f67-47c7-919c-fc6037c5ba07,gpt-5-mini,openai,port-compressor,26344,35699,62043,3603.732211,False,0.0,gpt-5-mini,port-compressor,3603.732211,False,0.0,False,3603.732211 +6cdfca9a-d1d2-4121-9068-b54e593e747e,grok-4-0709,xai,mteb-retrieve,4393,1710,6103,534.025029,False,0.0,grok-4-0709,mteb-retrieve,534.025029,False,0.0,False,534.025029 +455235f9-312f-467c-9838-c24a11a152eb,gemini-2.5-flash,gemini,cancel-async-tasks,1965,1849,3814,160.217778,False,0.0,gemini-2.5-flash,cancel-async-tasks,160.217778,False,0.2,False,160.217778 +cae30b61-6509-4c48-9a9b-1ca2a188926a,gpt-5-mini,openai,configure-git-webserver,4505,1113,5618,296.458239,True,1.0,gpt-5-mini,configure-git-webserver,296.458239,True,0.6,True,296.458239 +1a053e8f-4280-470f-a8e8-ffb2a6e869f8,claude-sonnet-4-20250514,anthropic,path-tracing-reverse,10662,10929,21591,1630.085549,False,0.0,claude-sonnet-4-20250514,path-tracing-reverse,1630.085549,False,0.0,False,1630.085549 +5774efab-97fd-4112-999f-d57b3591a08e,openai/gpt-oss-120b,together_ai,break-filter-js-from-html,10255,15803,26058,1208.666921,False,0.0,openai/gpt-oss-120b,break-filter-js-from-html,1208.666921,False,0.0,False,1208.666921 +f9411475-ddb3-4b2b-989e-8e98f3f1ecf3,claude-sonnet-4-20250514,anthropic,code-from-image,10091,5967,16058,536.517756,True,1.0,claude-sonnet-4-20250514,code-from-image,536.517756,True,0.2,True,536.517756 +05da3efd-d0f3-4a02-b588-b84c9904fc0e,claude-opus-4-1-20250805,anthropic,circuit-fibsqrt,26225,23277,49502,724.351243,False,0.0,claude-opus-4-1-20250805,circuit-fibsqrt,724.351243,False,0.0,False,724.351243 +bdfb249c-9ee6-4b39-b04b-e2539ff5659a,claude-opus-4-1-20250805,anthropic,model-extraction-relu-logits,7298,11729,19027,578.998697,False,0.0,claude-opus-4-1-20250805,model-extraction-relu-logits,578.998697,False,0.0,False,578.998697 
+3751bb05-2ea2-4b84-bf8a-3594ece74bab,zai-org/GLM-4.5-Air-FP8,together_ai,merge-diff-arc-agi-task,12941,6802,19743,246.856887,False,0.0,zai-org/GLM-4.5-Air-FP8,merge-diff-arc-agi-task,246.856887,False,0.0,False,246.856887 +2df9a216-4d5e-4759-87b5-4bd5fbbbbd0f,gpt-5-nano,openai,polyglot-rust-c,6407,4432,10839,252.606981,False,0.0,gpt-5-nano,polyglot-rust-c,252.606981,False,0.0,False,252.606981 +0f838bbd-e6f7-4ae4-9f82-3ff6f4fbd817,claude-opus-4-1-20250805,anthropic,configure-git-webserver,7035,2318,9353,511.925172,True,1.0,claude-opus-4-1-20250805,configure-git-webserver,511.925172,True,0.625,True,511.925172 +66c33fcb-659e-4812-8644-634fd8bc99fb,deepseek-ai/DeepSeek-V3.1,together_ai,install-windows-3.11,10045,3019,13064,335.310874,False,0.0,deepseek-ai/DeepSeek-V3.1,install-windows-3.11,335.310874,False,0.0,False,335.310874 +7759896f-4d72-4d48-84e4-eaf18d9cf937,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,model-extraction-relu-logits,1389,1944,3333,82.556417,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,model-extraction-relu-logits,82.556417,False,0.0,False,82.556417 +96d921ad-2d82-4847-aca9-27bc88441a3c,grok-code-fast-1,xai,bn-fit-modify,10341,2583,12924,514.002196,False,0.0,grok-code-fast-1,bn-fit-modify,514.002196,False,0.0,False,514.002196 +45b665b8-f440-4cf7-89e2-00df40c64b76,grok-4-0709,xai,make-doom-for-mips,14936,3776,18712,915.446561,False,0.0,grok-4-0709,make-doom-for-mips,915.446561,False,0.0,False,915.446561 +21dc4950-581a-43c9-b9c0-3ef43be39b36,claude-opus-4-1-20250805,anthropic,constraints-scheduling,5790,3734,9524,365.262643,True,1.0,claude-opus-4-1-20250805,constraints-scheduling,365.262643,True,0.8888888888888888,True,365.262643 +bb1f978f-7401-4b2d-8877-f5734cf24a72,deepseek-ai/DeepSeek-V3.1,together_ai,write-compressor,9038,7204,16242,311.253096,False,0.0,deepseek-ai/DeepSeek-V3.1,write-compressor,311.253096,False,0.0,False,311.253096 
+bb812fde-9294-4228-9db7-fa72b3b96fde,gpt-5,openai,large-scale-text-editing,5817,5344,11161,1205.311247,False,0.0,gpt-5,large-scale-text-editing,1205.311247,False,0.4285714285714285,False,1205.311247 +0f680b06-2d72-4618-998d-51a244056a70,OpenAI/gpt-oss-20B,together_ai,port-compressor,4606,16516,21122,324.349625,False,0.0,OpenAI/gpt-oss-20B,port-compressor,324.349625,False,0.0,False,324.349625 +29f04105-1318-4344-a102-34391b76d4e1,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,torch-tensor-parallelism,4878,3656,8534,94.44862,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,torch-tensor-parallelism,94.44862,False,0.0,False,94.44862 +09713cbb-464c-464f-bfa9-dbee1168de13,moonshotai/Kimi-K2-Instruct-0905,together_ai,circuit-fibsqrt,12104,11576,23680,2370.808709,False,0.0,moonshotai/Kimi-K2-Instruct-0905,circuit-fibsqrt,2370.808709,False,0.0,False,2370.808709 +b630e084-7e40-42a2-808c-86c20bc1a230,openai/gpt-oss-120b,together_ai,qemu-alpine-ssh,1355,2328,3683,110.566921,False,0.0,openai/gpt-oss-120b,qemu-alpine-ssh,110.566921,False,0.0,False,110.566921 +ce9404d9-5f38-4b79-9763-acec983732d4,grok-4-0709,xai,feal-linear-cryptanalysis,4726,2917,7643,1810.901472,False,0.0,grok-4-0709,feal-linear-cryptanalysis,1810.901472,False,0.0,False,1810.901472 +a32654a9-5819-4eeb-bc8e-c5ab09e6281a,moonshotai/Kimi-K2-Instruct-0905,together_ai,qemu-startup,2076,2509,4585,344.061338,False,0.0,moonshotai/Kimi-K2-Instruct-0905,qemu-startup,344.061338,False,0.4,False,344.061338 +1657b0c7-a2a6-4dab-bad7-9fcb89e0b152,claude-opus-4-1-20250805,anthropic,feal-differential-cryptanalysis,31221,31950,63171,1800.332737,False,0.0,claude-opus-4-1-20250805,feal-differential-cryptanalysis,1800.332737,False,0.0,False,1800.332737 +446f5c8d-1333-4a32-be63-274d95b88d41,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,nginx-request-logging,7580,5889,13469,539.455068,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,nginx-request-logging,539.455068,False,0.0,False,539.455068 
+208b35c4-fb6f-4a58-8c9e-47a6c2532430,grok-code-fast-1,xai,chess-best-move,4526,728,5254,66.885994,False,0.0,grok-code-fast-1,chess-best-move,66.885994,False,0.0,False,66.885994 +bd628078-7615-4358-b535-a3418a3ae5af,claude-opus-4-1-20250805,anthropic,pypi-server,5578,2912,8490,127.156995,True,1.0,claude-opus-4-1-20250805,pypi-server,127.156995,True,1.0,True,127.156995 +3a05787b-6b08-4a93-8da8-33450486b97a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,torch-tensor-parallelism,2343,1000,3343,70.14437,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,torch-tensor-parallelism,70.14437,False,0.0,False,70.14437 +7e161c6e-d4cf-4053-b3d8-6175596e50be,claude-sonnet-4-20250514,anthropic,extract-elf,2825,2462,5287,378.624993,False,0.0,claude-sonnet-4-20250514,extract-elf,378.624993,False,0.2,False,378.624993 +91e02959-3ec2-4409-be19-40fd8e445ee3,claude-opus-4-1-20250805,anthropic,distribution-search,40818,59031,99849,2382.451914,True,1.0,claude-opus-4-1-20250805,distribution-search,2382.451914,True,0.5555555555555556,True,2382.451914 +600c9d42-84e0-479e-bcea-f8dd1e735257,zai-org/GLM-4.5-Air-FP8,together_ai,train-fasttext,23071,9548,32619,2748.916437,False,0.0,zai-org/GLM-4.5-Air-FP8,train-fasttext,2748.916437,False,0.2,False,2748.916437 +51484877-d0db-4b4a-88da-c949886f9792,claude-opus-4-1-20250805,anthropic,merge-diff-arc-agi-task,14157,5347,19504,473.351028,False,0.0,claude-opus-4-1-20250805,merge-diff-arc-agi-task,473.351028,False,0.3333333333333333,False,473.351028 +f9f5040e-e07c-4047-a7bf-f0d6b5f78e7a,claude-opus-4-1-20250805,anthropic,break-filter-js-from-html,22612,24696,47308,1200.001203,False,0.0,claude-opus-4-1-20250805,break-filter-js-from-html,1200.001203,False,0.2222222222222222,False,1200.001203 +41972ba3-40f1-401f-8e1b-9b1f30d968ee,gpt-5-nano,openai,fix-git,9579,7525,17104,914.106193,False,0.0,gpt-5-nano,fix-git,914.106193,False,0.0,False,914.106193 
+1eba1354-4db4-4665-81f8-fcc0fdb58cb1,claude-sonnet-4-20250514,anthropic,sqlite-with-gcov,11761,3282,15043,486.47177,False,0.0,claude-sonnet-4-20250514,sqlite-with-gcov,486.47177,False,0.2,False,486.47177 +640c6edb-f40e-4380-86d9-438f9e24839d,zai-org/GLM-4.5-Air-FP8,together_ai,dna-insert,11983,6532,18515,617.783595,False,0.0,zai-org/GLM-4.5-Air-FP8,dna-insert,617.783595,False,0.0,False,617.783595 +d3a6f04d-14e8-4ff4-9dc6-0abd8dfbd2a0,gpt-5-mini,openai,merge-diff-arc-agi-task,7161,4885,12046,909.820458,False,0.0,gpt-5-mini,merge-diff-arc-agi-task,909.820458,False,0.4,False,909.820458 +86698a4e-39a5-4a74-91e1-87c1108d267f,moonshotai/Kimi-K2-Instruct-0905,together_ai,torch-tensor-parallelism,12720,3656,16376,548.275601,False,0.0,moonshotai/Kimi-K2-Instruct-0905,torch-tensor-parallelism,548.275601,False,0.0,False,548.275601 +8220946e-12f7-4fb8-908e-43039408601e,gpt-5-mini,openai,large-scale-text-editing,1660,929,2589,146.349982,False,0.0,gpt-5-mini,large-scale-text-editing,146.349982,False,0.2,False,146.349982 +0220ba0e-a034-4a0e-b31e-0b5e446e45cc,gemini-2.5-flash,gemini,qemu-startup,1255,1059,2314,81.959598,False,0.0,gemini-2.5-flash,qemu-startup,81.959598,False,0.2,False,81.959598 +095634db-b3bd-4bae-aab7-d37d2155318d,gpt-5,openai,crack-7z-hash,10148,5059,15207,735.296622,True,1.0,gpt-5,crack-7z-hash,735.296622,True,0.4285714285714285,True,735.296622 +00ba2e3f-ac3c-4c49-bcdd-9956db30b810,deepseek-ai/DeepSeek-V3.1,together_ai,install-klee-minimal,15187,1917,17104,900.52118,False,0.0,deepseek-ai/DeepSeek-V3.1,install-klee-minimal,900.52118,False,0.0,False,900.52118 +0a83829c-c44e-4ab6-9cfa-6418dd9037be,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,polyglot-c-py,3470,1848,5318,757.492192,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,polyglot-c-py,757.492192,False,0.0,False,757.492192 
+f4e9d225-b058-4d23-8ade-0e0807db12b8,gemini-2.5-pro,gemini,video-processing,15539,18831,34370,1271.858999,False,0.0,gemini-2.5-pro,video-processing,1271.858999,False,0.0,False,1271.858999 +aab53a59-5ee6-49f9-8d18-9a7e202b3bc5,openai/gpt-oss-120b,together_ai,largest-eigenval,8452,7563,16015,900.002571,False,0.0,openai/gpt-oss-120b,largest-eigenval,900.002571,False,0.0,False,900.002571 +6ea4f896-8f6e-4e95-9751-e1bad37e10b2,claude-opus-4-1-20250805,anthropic,cobol-modernization,7397,4353,11750,478.885807,True,1.0,claude-opus-4-1-20250805,cobol-modernization,478.885807,True,0.875,True,478.885807 +da22d103-c125-4b0a-a191-774618359ebc,deepseek-ai/DeepSeek-V3.1,together_ai,video-processing,10560,9133,19693,429.39043,False,0.0,deepseek-ai/DeepSeek-V3.1,video-processing,429.39043,False,0.0,False,429.39043 +84240b1c-ddc2-4252-a0ce-1f6ddb238e5c,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-initramfs-qemu,1595,862,2457,91.746305,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-initramfs-qemu,91.746305,False,0.0,False,91.746305 +3444cf90-0da6-4132-90e3-965cc6257dda,OpenAI/gpt-oss-20B,together_ai,prove-plus-comm,348,386,734,60.608726,False,0.0,OpenAI/gpt-oss-20B,prove-plus-comm,60.608726,False,0.0,False,60.608726 +03667af4-0c30-4352-ab3b-9ce5de3059d1,deepseek-ai/DeepSeek-V3.1,together_ai,fix-ocaml-gc,50804,26706,77510,3284.454139,False,0.0,deepseek-ai/DeepSeek-V3.1,fix-ocaml-gc,3284.454139,False,0.0,False,3284.454139 +3f78b1e8-cb9d-4af8-b2c7-e903385708df,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,pypi-server,4713,3260,7973,916.468089,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,pypi-server,916.468089,False,0.0,False,916.468089 +71586f18-147f-4470-af96-cd90279d7797,gpt-5,openai,openssl-selfsigned-cert,2458,1532,3990,161.294279,True,1.0,gpt-5,openssl-selfsigned-cert,161.294279,True,1.0,True,161.294279 
+c03d7a65-331c-4eff-bc96-f7303af5fca0,gpt-5-nano,openai,sqlite-db-truncate,10186,13889,24075,900.049675,False,0.0,gpt-5-nano,sqlite-db-truncate,900.049675,False,0.0,False,900.049675 +659a64cf-6cec-461d-be27-ba80f0230a3c,gpt-5-nano,openai,sqlite-with-gcov,6549,8186,14735,900.019909,False,0.0,gpt-5-nano,sqlite-with-gcov,900.019909,False,0.6,False,900.019909 +25a59681-30bd-494c-8d91-a7320a56800c,claude-sonnet-4-20250514,anthropic,nginx-request-logging,6477,3692,10169,237.665196,True,1.0,claude-sonnet-4-20250514,nginx-request-logging,237.665196,True,1.0,True,237.665196 +1cacca91-de7c-49fd-9523-7f3daa0bec69,zai-org/GLM-4.5-Air-FP8,together_ai,feal-differential-cryptanalysis,3870,2963,6833,55.728406,False,0.0,zai-org/GLM-4.5-Air-FP8,feal-differential-cryptanalysis,55.728406,False,0.0,False,55.728406 +142c88ab-1bfc-4243-8a50-441a4e82567d,openai/gpt-oss-120b,together_ai,adaptive-rejection-sampler,8760,8467,17227,701.928281,False,0.0,openai/gpt-oss-120b,adaptive-rejection-sampler,701.928281,False,0.0,False,701.928281 +ea726cef-402c-4aaf-80f0-e3c7b63ed41a,grok-4-0709,xai,sqlite-db-truncate,3510,1437,4947,900.016756,False,0.0,grok-4-0709,sqlite-db-truncate,900.016756,False,0.0,False,900.016756 +167f9707-2009-463e-aac0-23434c79828a,gpt-5-mini,openai,log-summary-date-ranges,5741,2396,8137,136.758542,False,0.0,gpt-5-mini,log-summary-date-ranges,136.758542,False,0.0,False,136.758542 +9bdf3eb5-4198-44d1-85f8-109fd136eedb,gpt-5,openai,chess-best-move,20535,7844,28379,900.001182,False,0.0,gpt-5,chess-best-move,900.001182,False,0.0,False,900.001182 +0f3f110a-3987-43ef-9774-6a0428e6a22e,gemini-2.5-pro,gemini,sanitize-git-repo,11955,2178,14133,1176.674548,False,0.0,gemini-2.5-pro,sanitize-git-repo,1176.674548,False,0.0,False,1176.674548 +45d4a871-c0d3-46a8-bf94-b396141700ea,OpenAI/gpt-oss-20B,together_ai,git-leak-recovery,700,528,1228,106.92239,False,0.0,OpenAI/gpt-oss-20B,git-leak-recovery,106.92239,False,0.0,False,106.92239 
+e1a72fef-b8cd-46bb-8aa3-f504a431046c,gpt-5-mini,openai,cancel-async-tasks,1847,1362,3209,119.909751,False,0.0,gpt-5-mini,cancel-async-tasks,119.909751,False,0.4,False,119.909751 +3155d64f-1f4f-47c9-af01-b40e8f88f552,gpt-5-nano,openai,sqlite-with-gcov,4802,1907,6709,108.302722,False,0.0,gpt-5-nano,sqlite-with-gcov,108.302722,False,0.6,False,108.302722 +149466b5-6db1-4d8b-8283-657408679c3a,gpt-5,openai,pypi-server,3211,1427,4638,163.696097,True,1.0,gpt-5,pypi-server,163.696097,True,0.3333333333333333,True,163.696097 +fdd88afb-f22c-4dc6-9172-7c41dc25da59,gpt-5,openai,financial-document-processor,18331,12113,30444,955.653402,False,0.0,gpt-5,financial-document-processor,955.653402,False,0.0,False,955.653402 +22ff6409-3676-44da-8361-fd93f8004708,openai/gpt-oss-120b,together_ai,dna-assembly,2892,2053,4945,85.843506,False,0.0,openai/gpt-oss-120b,dna-assembly,85.843506,False,0.0,False,85.843506 +2fdd2d38-9517-4155-8476-f0f16316c48b,gpt-5-mini,openai,merge-diff-arc-agi-task,9016,5994,15010,587.371606,True,1.0,gpt-5-mini,merge-diff-arc-agi-task,587.371606,True,0.4,True,587.371606 +e2502451-d4ef-4f33-9466-cd239cc9208a,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,regex-log,2871,3070,5941,283.320473,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,regex-log,283.320473,False,0.2,False,283.320473 +d0d9f21c-f0e4-46a9-9f67-789abecb4913,claude-opus-4-1-20250805,anthropic,git-leak-recovery,2888,1866,4754,119.716484,True,1.0,claude-opus-4-1-20250805,git-leak-recovery,119.716484,True,1.0,True,119.716484 +ef1dfe3a-22d5-4aa2-9d81-f53220c3591f,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sqlite-with-gcov,10743,2196,12939,281.09867,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sqlite-with-gcov,281.09867,False,0.6,False,281.09867 +b1ac6ea8-a88a-44f7-8a57-694326aea6cb,grok-4-0709,xai,bn-fit-modify,14161,8529,22690,1895.533263,False,0.0,grok-4-0709,bn-fit-modify,1895.533263,False,0.6,False,1895.533263 
+be64ed93-47b3-4cb4-94d3-55d1b9f6da75,claude-opus-4-1-20250805,anthropic,pytorch-model-cli,1800,1059,2859,900.510233,False,0.0,claude-opus-4-1-20250805,pytorch-model-cli,900.510233,False,0.4285714285714285,False,900.510233 +fbf21dcc-dc60-4165-9d8f-be4331582349,moonshotai/Kimi-K2-Instruct-0905,together_ai,dna-insert,7717,3385,11102,380.849063,False,0.0,moonshotai/Kimi-K2-Instruct-0905,dna-insert,380.849063,False,0.0,False,380.849063 +c931cdb9-5ce8-4b57-b843-3ac1c8db6239,claude-opus-4-1-20250805,anthropic,install-klee-minimal,16649,2233,18882,913.912962,False,0.0,claude-opus-4-1-20250805,install-klee-minimal,913.912962,False,0.0,False,913.912962 +8cb3e20e-abfe-4be8-ba31-c2613efe1532,openai/gpt-oss-120b,together_ai,feal-linear-cryptanalysis,3110,3233,6343,192.086214,False,0.0,openai/gpt-oss-120b,feal-linear-cryptanalysis,192.086214,False,0.4,False,192.086214 +3347e82c-2042-4df9-a32b-95dda8fd3ed5,gpt-5-nano,openai,code-from-image,19853,19087,38940,1184.555332,False,0.0,gpt-5-nano,code-from-image,1184.555332,False,0.0,False,1184.555332 +7b644390-94b0-4030-adb6-af2419227c78,gpt-5-mini,openai,sanitize-git-repo,9229,7326,16555,900.37908,False,0.0,gpt-5-mini,sanitize-git-repo,900.37908,False,0.0,False,900.37908 +18e99116-2877-467f-beb1-35ef6e60aa20,gemini-2.5-flash,gemini,pypi-server,11920,2351,14271,659.650635,False,0.0,gemini-2.5-flash,pypi-server,659.650635,False,0.0,False,659.650635 +6d490062-4b3f-45a3-8ccb-6464cf9f007c,grok-code-fast-1,xai,build-initramfs-qemu,1399,1246,2645,46.849707,False,0.0,grok-code-fast-1,build-initramfs-qemu,46.849707,False,0.0,False,46.849707 +951447fb-2065-4e01-9858-d6ca408ff24f,gpt-5,openai,dna-assembly,5207,8487,13694,724.760434,False,0.0,gpt-5,dna-assembly,724.760434,False,0.0,False,724.760434 +8b84f7b9-c687-4450-b541-f728a4c46c39,gpt-5-nano,openai,winning-avg-corewars,47147,46626,93773,3609.666848,False,0.0,gpt-5-nano,winning-avg-corewars,3609.666848,False,0.0,False,3609.666848 
+13dcf215-3eb1-4998-8420-73dd73409e84,openai/gpt-oss-120b,together_ai,chess-best-move,1882,1253,3135,524.814307,False,0.0,openai/gpt-oss-120b,chess-best-move,524.814307,False,0.0,False,524.814307 +bee9440b-9253-4d69-8da7-b2d6ae9d6cc1,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,install-klee-minimal,17709,2940,20649,900.066762,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,install-klee-minimal,900.066762,False,0.0,False,900.066762 +8af4b9ac-dcda-4bf0-aff9-b13947a9ee5c,grok-code-fast-1,xai,git-leak-recovery,1406,1005,2411,123.645644,True,1.0,grok-code-fast-1,git-leak-recovery,123.645644,True,0.2,True,123.645644 +95173a80-8a32-49d7-86ae-5cff8fadef75,claude-sonnet-4-20250514,anthropic,feal-linear-cryptanalysis,24754,23357,48111,1800.008542,False,0.0,claude-sonnet-4-20250514,feal-linear-cryptanalysis,1800.008542,False,0.0,False,1800.008542 +54b89816-ca4e-4d5a-af6a-79b687fc8ddb,claude-sonnet-4-20250514,anthropic,fix-git,3125,2333,5458,199.990105,True,1.0,claude-sonnet-4-20250514,fix-git,199.990105,True,1.0,True,199.990105 +c6ed2b83-0586-4bda-8ec7-9132960f515d,claude-opus-4-1-20250805,anthropic,feal-differential-cryptanalysis,29596,26171,55767,1869.677587,False,0.0,claude-opus-4-1-20250805,feal-differential-cryptanalysis,1869.677587,False,0.0,False,1869.677587 +36de5c8a-60aa-4341-9049-1fdc98684b9d,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,qemu-startup,1587,1237,2824,985.877287,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,qemu-startup,985.877287,False,0.0,False,985.877287 +b05e161c-a86d-4936-ab9c-6ba23a95fe79,gpt-5,openai,password-recovery,10003,10358,20361,901.586461,False,0.0,gpt-5,password-recovery,901.586461,False,0.0,False,901.586461 +35692ba5-269b-42ed-9476-e649ecdaa753,gemini-2.5-pro,gemini,largest-eigenval,7436,6682,14118,913.605252,False,0.0,gemini-2.5-pro,largest-eigenval,913.605252,False,0.0,False,913.605252 
+f4c2b1da-0e84-44bc-8a9d-f5285191d55d,claude-opus-4-1-20250805,anthropic,password-recovery,7775,4929,12704,900.000778,False,0.0,claude-opus-4-1-20250805,password-recovery,900.000778,False,0.5555555555555556,False,900.000778 +2d83485b-af72-448b-8644-258d388ba039,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,pytorch-model-cli,10262,9540,19802,627.12886,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,pytorch-model-cli,627.12886,False,0.0,False,627.12886 +21daf928-d0ec-4df8-b867-b5c1e28357ff,zai-org/GLM-4.5-Air-FP8,together_ai,regex-log,2540,4070,6610,163.981409,False,0.0,zai-org/GLM-4.5-Air-FP8,regex-log,163.981409,False,0.2,False,163.981409 +9fcc9d97-9d54-4400-acd7-c14e2b4fbe10,grok-4-0709,xai,dna-assembly,1152,246,1398,720.096869,False,0.0,grok-4-0709,dna-assembly,720.096869,False,0.0,False,720.096869 +fb214946-32fa-44de-b847-b2475aba59bd,claude-opus-4-1-20250805,anthropic,qemu-alpine-ssh,2454,2358,4812,303.443405,True,1.0,claude-opus-4-1-20250805,qemu-alpine-ssh,303.443405,True,0.8571428571428571,True,303.443405 +749c9a3b-f330-423b-b22c-1dce67dfb7a5,gpt-5-mini,openai,merge-diff-arc-agi-task,4409,5038,9447,906.533537,False,0.0,gpt-5-mini,merge-diff-arc-agi-task,906.533537,False,0.4,False,906.533537 +0ae49add-4c2e-4767-ad43-36288de6dda9,moonshotai/Kimi-K2-Instruct-0905,together_ai,pypi-server,3272,1866,5138,910.536401,False,0.0,moonshotai/Kimi-K2-Instruct-0905,pypi-server,910.536401,False,0.2,False,910.536401 +58c7f7cc-eafd-422d-9c35-a18728eb653d,grok-4-0709,xai,reverse-engineering,4964,2311,7275,1800.96446,False,0.0,grok-4-0709,reverse-engineering,1800.96446,False,0.2,False,1800.96446 +e5471318-1caa-40f6-a2b5-12e33bb82412,gpt-5-nano,openai,path-tracing,1295,888,2183,175.308208,False,0.0,gpt-5-nano,path-tracing,175.308208,False,0.2,False,175.308208 
+d758d4fb-cbcf-4979-912e-978e826107a7,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,fix-code-vulnerability,19910,5882,25792,982.605331,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,fix-code-vulnerability,982.605331,False,0.0,False,982.605331 +11e10e32-c808-4617-a5c6-a35438ee25ec,claude-sonnet-4-20250514,anthropic,winning-avg-corewars,23002,20790,43792,1921.203205,False,0.0,claude-sonnet-4-20250514,winning-avg-corewars,1921.203205,False,0.0,False,1921.203205 +d714136b-c860-4e04-9679-f00f0b6db4c0,gpt-5-nano,openai,financial-document-processor,27380,16179,43559,1202.752336,False,0.0,gpt-5-nano,financial-document-processor,1202.752336,False,0.0,False,1202.752336 +de65f11d-d2b3-4458-b327-303bc6cc7d61,claude-opus-4-1-20250805,anthropic,cancel-async-tasks,5762,3549,9311,798.728735,True,1.0,claude-opus-4-1-20250805,cancel-async-tasks,798.728735,True,0.125,True,798.728735 +a3af84d2-1ed8-4293-94ec-a59f23bda1f4,moonshotai/Kimi-K2-Instruct-0905,together_ai,sqlite-with-gcov,9884,2085,11969,912.912405,False,0.0,moonshotai/Kimi-K2-Instruct-0905,sqlite-with-gcov,912.912405,False,0.4,False,912.912405 +dcb980fc-3489-45d7-a06e-8364d34ab8f0,openai/gpt-oss-120b,together_ai,sqlite-with-gcov,1213,1020,2233,160.96343,False,0.0,openai/gpt-oss-120b,sqlite-with-gcov,160.96343,False,0.8,False,160.96343 +9d979ae2-3d24-4dd2-88ed-78ff253fa3cb,grok-4-0709,xai,dna-assembly,1154,225,1379,720.005426,False,0.0,grok-4-0709,dna-assembly,720.005426,False,0.0,False,720.005426 +f715ce5e-fe2a-48e1-b230-ae62244908c2,deepseek-ai/DeepSeek-V3.1,together_ai,code-from-image,5600,1982,7582,104.090577,True,1.0,deepseek-ai/DeepSeek-V3.1,code-from-image,104.090577,True,0.6,True,104.090577 +6123c128-f4e2-4575-beb7-18c6d37ac3da,OpenAI/gpt-oss-20B,together_ai,pypi-server,1584,1051,2635,54.839259,False,0.0,OpenAI/gpt-oss-20B,pypi-server,54.839259,False,0.2,False,54.839259 
+d2eeb2f5-eed6-418c-8719-d0e731de67a5,OpenAI/gpt-oss-20B,together_ai,path-tracing,323,1641,1964,904.008497,False,0.0,OpenAI/gpt-oss-20B,path-tracing,904.008497,False,0.0,False,904.008497 +acea63b2-219b-4724-a789-b6833632c03c,grok-4-0709,xai,merge-diff-arc-agi-task,8157,2333,10490,581.150503,True,1.0,grok-4-0709,merge-diff-arc-agi-task,581.150503,True,0.4,True,581.150503 +a8681aad-3ca2-47af-b5de-071081dd86d2,gpt-5-nano,openai,qemu-startup,3304,4147,7451,900.401521,False,0.0,gpt-5-nano,qemu-startup,900.401521,False,0.0,False,900.401521 +7f4d951a-b4c0-401d-a745-68e00ce7d4a0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,port-compressor,16227,5054,21281,947.739082,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,port-compressor,947.739082,False,0.0,False,947.739082 +7ec1dc23-8b59-4aec-b92c-399288c85d61,gemini-2.5-pro,gemini,code-from-image,5624,1621,7245,176.713528,True,1.0,gemini-2.5-pro,code-from-image,176.713528,True,1.0,True,176.713528 +3c46035e-92a3-47ac-ba2e-17387b46af4a,zai-org/GLM-4.5-Air-FP8,together_ai,reverse-engineering,23448,15352,38800,1815.027932,False,0.0,zai-org/GLM-4.5-Air-FP8,reverse-engineering,1815.027932,False,0.0,False,1815.027932 +e3dbbb46-2c7c-437b-8581-43761667d6d1,openai/gpt-oss-120b,together_ai,reshard-c4-data,6820,6747,13567,529.4665,False,0.0,openai/gpt-oss-120b,reshard-c4-data,529.4665,False,0.0,False,529.4665 +b2f19a2d-2518-4456-8333-b4046c3d407c,gpt-5,openai,install-windows-3.11,4899,1695,6594,259.88754,False,0.0,gpt-5,install-windows-3.11,259.88754,False,0.0,False,259.88754 +fbd7997a-754f-4649-9ae4-6d6e516dd222,deepseek-ai/DeepSeek-V3.1,together_ai,configure-git-webserver,6011,1642,7653,684.642626,True,1.0,deepseek-ai/DeepSeek-V3.1,configure-git-webserver,684.642626,True,1.0,True,684.642626 +458cca10-69c2-4cc9-90af-b29853ae757a,openai/gpt-oss-120b,together_ai,configure-git-webserver,4062,1191,5253,168.864368,True,1.0,openai/gpt-oss-120b,configure-git-webserver,168.864368,True,0.6,True,168.864368 
+51398805-a475-431c-b400-1826c0acf5f1,gemini-2.5-flash,gemini,extract-elf,2022,1730,3752,203.397886,False,0.0,gemini-2.5-flash,extract-elf,203.397886,False,0.4,False,203.397886 +f36962c8-fec8-405e-bd8c-3898e34c5998,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,code-from-image,19776,5613,25389,1204.802094,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,code-from-image,1204.802094,False,0.2,False,1204.802094 +0f06d7df-060d-40e6-89db-9a3eacf6194e,gemini-2.5-pro,gemini,polyglot-rust-c,1687,2229,3916,424.089692,False,0.0,gemini-2.5-pro,polyglot-rust-c,424.089692,False,0.0,False,424.089692 +24fe1f4f-ac82-4a49-997c-b9e0d0279746,gemini-2.5-flash,gemini,winning-avg-corewars,33797,48251,82048,3625.773378,False,0.0,gemini-2.5-flash,winning-avg-corewars,3625.773378,False,0.0,False,3625.773378 +b5befc8d-dabc-4f55-a9aa-b6a13d364079,claude-sonnet-4-20250514,anthropic,prove-plus-comm,2661,2522,5183,448.93355,True,1.0,claude-sonnet-4-20250514,prove-plus-comm,448.93355,True,1.0,True,448.93355 +5aa1749d-6029-4ce2-aec5-ce433919311a,claude-opus-4-1-20250805,anthropic,mteb-retrieve,2348,1671,4019,284.420526,False,0.0,claude-opus-4-1-20250805,mteb-retrieve,284.420526,False,0.0,False,284.420526 +b6ca23b6-7f97-4085-9849-9162911f17ac,gpt-5-mini,openai,tune-mjcf,9989,6681,16670,924.84925,False,0.0,gpt-5-mini,tune-mjcf,924.84925,False,0.0,False,924.84925 +add15559-6664-4fe8-a788-73a20ebdbef3,zai-org/GLM-4.5-Air-FP8,together_ai,tune-mjcf,10119,9681,19800,1041.461925,False,0.0,zai-org/GLM-4.5-Air-FP8,tune-mjcf,1041.461925,False,0.0,False,1041.461925 +3dd95f6a-88a9-41c9-a147-23a38b77569b,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,cancel-async-tasks,1203,595,1798,178.634469,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,cancel-async-tasks,178.634469,True,0.8,True,178.634469 
+dce2ba82-f078-4743-b4a8-e1ac0ef5a310,claude-opus-4-1-20250805,anthropic,schemelike-metacircular-eval,32237,29249,61486,2411.786063,False,0.0,claude-opus-4-1-20250805,schemelike-metacircular-eval,2411.786063,False,0.0,False,2411.786063 +da87cd0e-5791-4a97-a839-15b884240b3f,claude-opus-4-1-20250805,anthropic,code-from-image,5468,5384,10852,238.054528,False,0.0,claude-opus-4-1-20250805,code-from-image,238.054528,False,0.125,False,238.054528 +017ee42e-11a5-49c8-8e23-e9abfd41e5a1,gemini-2.5-pro,gemini,sparql-university,4768,2052,6820,197.260861,False,0.0,gemini-2.5-pro,sparql-university,197.260861,False,0.6,False,197.260861 +5758f3f6-7ba3-43a3-927a-2acee10ea356,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,vulnerable-secret,8002,5014,13016,909.040839,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,vulnerable-secret,909.040839,False,0.4,False,909.040839 +e5e25819-3c72-4a40-8beb-4a8dbc7d2eac,claude-opus-4-1-20250805,anthropic,reshard-c4-data,8193,6612,14805,797.980871,False,0.0,claude-opus-4-1-20250805,reshard-c4-data,797.980871,False,0.0,False,797.980871 +531df2f4-5755-46a2-9812-43bdd2f19fec,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-pmars,19079,5420,24499,501.241387,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-pmars,501.241387,True,0.2,True,501.241387 +9c2fe063-782e-40e1-ae1d-b58d66d2c509,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,prove-plus-comm,4751,5645,10396,900.492358,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,prove-plus-comm,900.492358,False,0.2,False,900.492358 +770daba9-fc1b-472c-ab07-65c8a4ef928a,gpt-5-mini,openai,feal-differential-cryptanalysis,2563,1716,4279,373.724736,False,0.0,gpt-5-mini,feal-differential-cryptanalysis,373.724736,False,0.0,False,373.724736 +2c08e10c-8327-4666-999f-d81220e36c00,moonshotai/Kimi-K2-Instruct-0905,together_ai,sanitize-git-repo,7377,3503,10880,410.238054,False,0.0,moonshotai/Kimi-K2-Instruct-0905,sanitize-git-repo,410.238054,False,0.0,False,410.238054 
+ea6755e0-4673-40dd-a376-0b89aca8b8b6,deepseek-ai/DeepSeek-V3.1,together_ai,log-summary-date-ranges,8297,2736,11033,120.690841,False,0.0,deepseek-ai/DeepSeek-V3.1,log-summary-date-ranges,120.690841,False,0.4,False,120.690841 +01e207d2-b71d-43ed-81a8-b8e2c2e71036,deepseek-ai/DeepSeek-V3.1,together_ai,cancel-async-tasks,1953,1245,3198,726.759106,False,0.0,deepseek-ai/DeepSeek-V3.1,cancel-async-tasks,726.759106,False,0.4,False,726.759106 +34334893-efad-4109-9784-d0245a0a8599,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-initramfs-qemu,11851,5588,17439,907.024987,False,0.0,moonshotai/Kimi-K2-Instruct-0905,build-initramfs-qemu,907.024987,False,0.0,False,907.024987 +dbafd7d3-b05a-4122-a6eb-4aff4f5429bb,gpt-5-nano,openai,distribution-search,20908,26332,47240,1625.734429,True,1.0,gpt-5-nano,distribution-search,1625.734429,True,0.25,True,1625.734429 +c12acb24-1dfa-477c-9249-3fcfa4dafa15,gpt-5,openai,video-processing,4629,3992,8621,248.232755,False,0.0,gpt-5,video-processing,248.232755,False,0.0,False,248.232755 +71170a6c-0013-4658-9225-e1c911803c0d,OpenAI/gpt-oss-20B,together_ai,cancel-async-tasks,1194,535,1729,18.26774,False,0.0,OpenAI/gpt-oss-20B,cancel-async-tasks,18.26774,False,0.0,False,18.26774 +8ffd3460-8727-4288-8c4c-f07d37e44734,gpt-5,openai,merge-diff-arc-agi-task,7225,5851,13076,755.773528,True,1.0,gpt-5,merge-diff-arc-agi-task,755.773528,True,1.0,True,755.773528 +89d95090-6d65-43aa-bc9f-9d6c29cbdb51,gemini-2.5-pro,gemini,write-compressor,7202,6322,13524,946.373119,False,0.0,gemini-2.5-pro,write-compressor,946.373119,False,0.0,False,946.373119 +12c0dcf6-c511-46a3-b3a8-5426c50b5e9a,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,password-recovery,4677,4021,8698,904.441979,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,password-recovery,904.441979,False,0.2,False,904.441979 +0142a589-2275-40dc-83ef-e50cd901e96b,gpt-5-nano,openai,git-leak-recovery,9622,9417,19039,904.121029,False,0.0,gpt-5-nano,git-leak-recovery,904.121029,False,0.0,False,904.121029 
+684addef-1aa7-42b2-923c-1ddcd85cd084,openai/gpt-oss-120b,together_ai,pytorch-model-recovery,8104,5621,13725,348.259716,True,1.0,openai/gpt-oss-120b,pytorch-model-recovery,348.259716,True,0.4,True,348.259716 +ee5a7b12-ec19-449f-9741-a330a8f0aff8,claude-sonnet-4-20250514,anthropic,fix-ocaml-gc,50277,25974,76251,3604.199857,False,0.0,claude-sonnet-4-20250514,fix-ocaml-gc,3604.199857,False,0.0,False,3604.199857 +024712d5-2c9b-4b54-b91c-fc41bfba80ce,grok-code-fast-1,xai,write-compressor,3394,1915,5309,1445.626076,False,0.0,grok-code-fast-1,write-compressor,1445.626076,False,0.0,False,1445.626076 +00377d41-cba4-44ff-b3d8-51866886ea96,claude-sonnet-4-20250514,anthropic,build-initramfs-qemu,3911,3685,7596,986.848407,False,0.0,claude-sonnet-4-20250514,build-initramfs-qemu,986.848407,False,0.0,False,986.848407 +24250723-f08e-4070-9f23-c14d7665eb57,gemini-2.5-flash,gemini,largest-eigenval,5300,9729,15029,908.270288,False,0.0,gemini-2.5-flash,largest-eigenval,908.270288,False,0.0,False,908.270288 +fa474802-3795-42c2-8752-b0f71a729c48,zai-org/GLM-4.5-Air-FP8,together_ai,winning-avg-corewars,14757,14636,29393,972.475061,False,0.0,zai-org/GLM-4.5-Air-FP8,winning-avg-corewars,972.475061,False,0.0,False,972.475061 +5623a04b-13fa-490d-9942-b03ff68ac1fc,claude-sonnet-4-20250514,anthropic,git-leak-recovery,3213,2914,6127,389.821232,True,1.0,claude-sonnet-4-20250514,git-leak-recovery,389.821232,True,1.0,True,389.821232 +b88bd526-aea9-4290-91d6-14fa1cd84bf1,OpenAI/gpt-oss-20B,together_ai,fix-code-vulnerability,2885,11167,14052,906.414627,False,0.0,OpenAI/gpt-oss-20B,fix-code-vulnerability,906.414627,False,0.0,False,906.414627 +18d5ce4b-d83a-4733-b994-91112c211f11,moonshotai/Kimi-K2-Instruct-0905,together_ai,constraints-scheduling,4696,3325,8021,474.385982,True,1.0,moonshotai/Kimi-K2-Instruct-0905,constraints-scheduling,474.385982,True,0.6,True,474.385982 
+f1ed4354-e3be-4398-b2f4-5651da591e36,grok-code-fast-1,xai,install-windows-3.11,6247,2338,8585,320.577613,False,0.0,grok-code-fast-1,install-windows-3.11,320.577613,False,0.0,False,320.577613 +bfab6d2d-8b17-4530-b95d-706c2cffb57f,claude-opus-4-1-20250805,anthropic,code-from-image,26834,20240,47074,1220.200444,False,0.0,claude-opus-4-1-20250805,code-from-image,1220.200444,False,0.125,False,1220.200444 +a24f81e8-ad4b-4d0f-8af9-0adf522a359e,claude-opus-4-1-20250805,anthropic,port-compressor,62559,38856,101415,3600.594592,False,0.0,claude-opus-4-1-20250805,port-compressor,3600.594592,False,0.0,False,3600.594592 +a9f5326c-69dc-4656-bd6e-cd11e2bc15f1,moonshotai/Kimi-K2-Instruct-0905,together_ai,password-recovery,4120,4787,8907,575.619497,True,1.0,moonshotai/Kimi-K2-Instruct-0905,password-recovery,575.619497,True,0.2,True,575.619497 +70ad6e7e-f0bc-4bc8-9645-13f49bb4aed2,moonshotai/Kimi-K2-Instruct-0905,together_ai,regex-log,15426,13335,28761,845.755794,True,1.0,moonshotai/Kimi-K2-Instruct-0905,regex-log,845.755794,True,0.4,True,845.755794 +38177e56-a04d-43b5-a30a-3268bac4afdc,claude-opus-4-1-20250805,anthropic,build-initramfs-qemu,12117,4212,16329,833.239931,False,0.0,claude-opus-4-1-20250805,build-initramfs-qemu,833.239931,False,0.0,False,833.239931 +94cc043f-9ecf-4557-bbb8-70d1fc7fd678,grok-4-0709,xai,mteb-retrieve,1672,806,2478,295.140364,False,0.0,grok-4-0709,mteb-retrieve,295.140364,False,0.0,False,295.140364 +8ba1e39b-cbed-4f33-857a-86380ab4fb7e,zai-org/GLM-4.5-Air-FP8,together_ai,vulnerable-secret,5479,17265,22744,900.134525,False,0.0,zai-org/GLM-4.5-Air-FP8,vulnerable-secret,900.134525,False,0.0,False,900.134525 +51ae7bb7-3812-4e30-927e-28bf4ff4cf62,gpt-5,openai,circuit-fibsqrt,17293,11104,28397,1431.365257,True,1.0,gpt-5,circuit-fibsqrt,1431.365257,True,0.6666666666666666,True,1431.365257 
+5f137981-ac3e-404d-831c-0fefd096fc2f,OpenAI/gpt-oss-20B,together_ai,wasm-pipeline,130,1630,1760,902.181148,False,0.0,OpenAI/gpt-oss-20B,wasm-pipeline,902.181148,False,0.0,False,902.181148 +b015ac8a-4da2-4b05-b6c5-fe3edbcd01d4,deepseek-ai/DeepSeek-V3.1,together_ai,torch-tensor-parallelism,1828,1065,2893,11.058099,False,0.0,deepseek-ai/DeepSeek-V3.1,torch-tensor-parallelism,11.058099,False,0.0,False,11.058099 +f0437214-8b1f-42bd-86cf-480e9fad0f7c,grok-code-fast-1,xai,make-mips-interpreter,16200,16120,32320,613.110449,False,0.0,grok-code-fast-1,make-mips-interpreter,613.110449,False,0.0,False,613.110449 +3dc6ee1d-c738-42df-9d4f-f9ab5105377d,gpt-5,openai,torch-tensor-parallelism,2812,3379,6191,255.797965,False,0.0,gpt-5,torch-tensor-parallelism,255.797965,False,0.0,False,255.797965 +be9428a0-e800-47f4-8348-58c56cf3cd8a,moonshotai/Kimi-K2-Instruct-0905,together_ai,password-recovery,5668,5749,11417,913.523787,False,0.0,moonshotai/Kimi-K2-Instruct-0905,password-recovery,913.523787,False,0.2,False,913.523787 +a01331e5-dea6-4f81-8569-4a7e82ea9aff,gemini-2.5-pro,gemini,log-summary-date-ranges,8852,3316,12168,368.290727,False,0.0,gemini-2.5-pro,log-summary-date-ranges,368.290727,False,0.0,False,368.290727 +24bdd134-0be1-428e-87e9-39b14059ccf1,deepseek-ai/DeepSeek-V3.1,together_ai,install-klee-minimal,16728,1977,18705,904.257814,False,0.0,deepseek-ai/DeepSeek-V3.1,install-klee-minimal,904.257814,False,0.0,False,904.257814 +f51a4346-8c17-499d-8c43-51d22aac2fd5,gemini-2.5-flash,gemini,count-dataset-tokens,7423,2219,9642,386.547217,False,0.0,gemini-2.5-flash,count-dataset-tokens,386.547217,False,0.0,False,386.547217 +fc5b3318-05be-4b14-a2da-dc0bf1354ea1,gpt-5-nano,openai,bn-fit-modify,57195,64124,121319,3637.301526,False,0.0,gpt-5-nano,bn-fit-modify,3637.301526,False,0.0,False,3637.301526 +cd462294-8aa2-4141-9b82-2b07a1034ed0,grok-code-fast-1,xai,polyglot-rust-c,1212,701,1913,276.300903,False,0.0,grok-code-fast-1,polyglot-rust-c,276.300903,False,0.0,False,276.300903 
+d4164b69-d8c1-442b-8f5a-60cee6e144d7,gemini-2.5-flash,gemini,reshard-c4-data,3685,3409,7094,332.95525,False,0.0,gemini-2.5-flash,reshard-c4-data,332.95525,False,0.0,False,332.95525 +5242981e-10aa-4a7f-a2d4-64822a4db2af,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,schemelike-metacircular-eval,3188,5154,8342,1296.427146,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,schemelike-metacircular-eval,1296.427146,False,0.0,False,1296.427146 +32a49cbc-4893-42fa-9cb4-e728667d393c,gpt-5,openai,sparql-university,5669,2758,8427,332.210858,True,1.0,gpt-5,sparql-university,332.210858,True,0.8,True,332.210858 +feb1d26d-3c7c-4a92-b120-5c24f019d2b4,deepseek-ai/DeepSeek-V3.1,together_ai,vulnerable-secret,7572,5076,12648,752.382045,True,1.0,deepseek-ai/DeepSeek-V3.1,vulnerable-secret,752.382045,True,0.4,True,752.382045 +217a383a-2133-4d4f-af8e-dedcb8ee110c,gemini-2.5-pro,gemini,make-doom-for-mips,7010,1554,8564,1140.0117,False,0.0,gemini-2.5-pro,make-doom-for-mips,1140.0117,False,0.0,False,1140.0117 +a2281df0-d2df-43cf-8537-04b70c6ed2d1,gemini-2.5-flash,gemini,large-scale-text-editing,2585,1711,4296,109.534043,False,0.0,gemini-2.5-flash,large-scale-text-editing,109.534043,False,0.0,False,109.534043 +075f1854-8fee-4dcd-9aa1-7f288399efbb,zai-org/GLM-4.5-Air-FP8,together_ai,qemu-startup,701,1243,1944,136.411497,True,1.0,zai-org/GLM-4.5-Air-FP8,qemu-startup,136.411497,True,0.2,True,136.411497 +df93a0c1-4a8a-4783-bbde-c745ff4aec67,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,qemu-startup,3478,1885,5363,476.429801,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,qemu-startup,476.429801,False,0.4,False,476.429801 +7b3b5676-7179-4f92-8fa1-f669f91354c2,claude-sonnet-4-20250514,anthropic,cancel-async-tasks,2253,1612,3865,857.03885,True,1.0,claude-sonnet-4-20250514,cancel-async-tasks,857.03885,True,0.8,True,857.03885 
+2660b19a-84a4-4565-a735-807347fc7c0e,gpt-5-mini,openai,video-processing,2709,3569,6278,288.7109,False,0.0,gpt-5-mini,video-processing,288.7109,False,0.0,False,288.7109 +063dbee8-7e63-4b3c-a5eb-5e5623214906,OpenAI/gpt-oss-20B,together_ai,hf-model-inference,1135,2318,3453,156.540089,False,0.0,OpenAI/gpt-oss-20B,hf-model-inference,156.540089,False,0.4,False,156.540089 +a3b290be-abad-4ce2-b8b9-c3e5d3239159,claude-sonnet-4-20250514,anthropic,mteb-retrieve,2818,1990,4808,183.194009,False,0.0,claude-sonnet-4-20250514,mteb-retrieve,183.194009,False,0.0,False,183.194009 +c378e4f4-6428-436f-a9c7-a5a64f70b4b4,gemini-2.5-pro,gemini,feal-linear-cryptanalysis,15432,11415,26847,1408.283413,False,0.0,gemini-2.5-pro,feal-linear-cryptanalysis,1408.283413,False,0.0,False,1408.283413 +9efe4e45-ceec-49f6-8708-d011da533647,gemini-2.5-pro,gemini,configure-git-webserver,5162,975,6137,273.775654,False,0.0,gemini-2.5-pro,configure-git-webserver,273.775654,False,0.0,False,273.775654 +3d291e52-6166-417f-bd3e-9cd296d5dcba,openai/gpt-oss-120b,together_ai,reshard-c4-data,2470,4259,6729,324.155524,False,0.0,openai/gpt-oss-120b,reshard-c4-data,324.155524,False,0.0,False,324.155524 +1ab319e5-6efb-4e51-8a4a-b6322ed9e0ed,grok-code-fast-1,xai,path-tracing-reverse,2040,2048,4088,317.714265,False,0.0,grok-code-fast-1,path-tracing-reverse,317.714265,False,0.0,False,317.714265 +7713e6c5-4b75-44d0-8ea9-eb813fb08e53,moonshotai/Kimi-K2-Instruct-0905,together_ai,reshard-c4-data,10555,6042,16597,403.226755,False,0.0,moonshotai/Kimi-K2-Instruct-0905,reshard-c4-data,403.226755,False,0.0,False,403.226755 +7a63d8dc-80c5-45af-ae0b-cb781a904349,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-cython-ext,15849,6089,21938,802.605653,False,0.0,moonshotai/Kimi-K2-Instruct-0905,build-cython-ext,802.605653,False,0.0,False,802.605653 +c6f2ae87-ba96-4961-b7f1-b79b1f0cde6b,gpt-5,openai,build-pov-ray,22275,33534,55809,6000.096154,False,0.0,gpt-5,build-pov-ray,6000.096154,False,0.0,False,6000.096154 
+e0605fe4-17b8-4728-81bb-ceef585de0b6,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,install-windows-3.11,9028,3209,12237,385.069929,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,install-windows-3.11,385.069929,False,0.0,False,385.069929 +2ea58c60-b0c8-4e9b-a5aa-2f4958ba1bad,OpenAI/gpt-oss-20B,together_ai,fix-code-vulnerability,84,1130,1214,982.462561,False,0.0,OpenAI/gpt-oss-20B,fix-code-vulnerability,982.462561,False,0.0,False,982.462561 +bed5c58a-67a6-4675-8181-9de60c149ca3,grok-4-0709,xai,video-processing,2501,1706,4207,311.753488,False,0.0,grok-4-0709,video-processing,311.753488,False,0.0,False,311.753488 +44278ba4-f261-43c2-8ab6-715e3102d544,grok-4-0709,xai,polyglot-rust-c,0,0,0,906.139468,False,0.0,grok-4-0709,polyglot-rust-c,906.139468,False,0.0,False,906.139468 +f9df35ff-19b3-4af2-abf4-2e04081fcee2,openai/gpt-oss-120b,together_ai,wasm-pipeline,11252,10214,21466,903.444879,False,0.0,openai/gpt-oss-120b,wasm-pipeline,903.444879,False,0.0,False,903.444879 +a30ddbad-c58c-4740-9f6d-1bd05f10734f,gemini-2.5-flash,gemini,db-wal-recovery,6319,14451,20770,900.048317,False,0.0,gemini-2.5-flash,db-wal-recovery,900.048317,False,0.0,False,900.048317 +e3b9b919-ff1e-41ed-9cec-c249ff18ac4e,gpt-5,openai,fix-git,4320,1770,6090,268.257141,True,1.0,gpt-5,fix-git,268.257141,True,1.0,True,268.257141 +6f5d093d-532d-4bd3-8671-32dbd351be28,claude-opus-4-1-20250805,anthropic,regex-log,2946,3050,5996,92.971109,True,1.0,claude-opus-4-1-20250805,regex-log,92.971109,True,0.5714285714285714,True,92.971109 +c537c24f-7017-4b27-b700-0640307d24e4,claude-opus-4-1-20250805,anthropic,circuit-fibsqrt,62092,61828,123920,3606.374705,False,0.0,claude-opus-4-1-20250805,circuit-fibsqrt,3606.374705,False,0.0,False,3606.374705 +1a92c906-f747-415f-babd-2d320d28e92f,grok-4-0709,xai,qemu-startup,1013,546,1559,478.122418,True,1.0,grok-4-0709,qemu-startup,478.122418,True,0.4,True,478.122418 
+96a1eea1-5dbb-4812-88d3-ad61d306e395,grok-code-fast-1,xai,password-recovery,5702,1922,7624,1546.922871,False,0.0,grok-code-fast-1,password-recovery,1546.922871,False,0.0,False,1546.922871 +534d4f44-c66f-4e1b-9c66-4d0fe1c6921c,deepseek-ai/DeepSeek-V3.1,together_ai,filter-js-from-html,1667,1035,2702,40.795824,False,0.0,deepseek-ai/DeepSeek-V3.1,filter-js-from-html,40.795824,False,0.0,False,40.795824 +1546dec3-a5bd-4408-8c67-4725f6501921,moonshotai/Kimi-K2-Instruct-0905,together_ai,financial-document-processor,8369,6330,14699,392.163094,False,0.0,moonshotai/Kimi-K2-Instruct-0905,financial-document-processor,392.163094,False,0.0,False,392.163094 +43f4609c-8611-4ded-8bfd-a0f568591a75,gpt-5,openai,pytorch-model-cli,3532,2353,5885,515.502561,False,0.0,gpt-5,pytorch-model-cli,515.502561,False,0.0,False,515.502561 +5433cf05-62ee-421d-98a5-869a8e759388,OpenAI/gpt-oss-20B,together_ai,bn-fit-modify,12334,48165,60499,3603.325587,False,0.0,OpenAI/gpt-oss-20B,bn-fit-modify,3603.325587,False,0.0,False,3603.325587 +5391de27-0405-427e-b375-f08e4d6bc31c,gpt-5-mini,openai,sanitize-git-repo,4429,3287,7716,255.859868,False,0.0,gpt-5-mini,sanitize-git-repo,255.859868,False,0.0,False,255.859868 +77aebeb2-e444-4750-a9aa-5d868a61dc01,grok-code-fast-1,xai,wasm-pipeline,15186,9806,24992,595.729928,True,1.0,grok-code-fast-1,wasm-pipeline,595.729928,True,0.2,True,595.729928 +29e23bc8-878b-463b-8c3b-27f1dfd4ee7a,gemini-2.5-pro,gemini,make-doom-for-mips,17009,4714,21723,903.060768,False,0.0,gemini-2.5-pro,make-doom-for-mips,903.060768,False,0.0,False,903.060768 +1965159e-f932-4aeb-8d8c-d239215dd483,gemini-2.5-flash,gemini,video-processing,5960,3692,9652,163.565985,False,0.0,gemini-2.5-flash,video-processing,163.565985,False,0.0,False,163.565985 +6cd0e534-5058-4a48-876d-0c3556839d7f,OpenAI/gpt-oss-20B,together_ai,vulnerable-secret,1496,4441,5937,911.566206,False,0.0,OpenAI/gpt-oss-20B,vulnerable-secret,911.566206,False,0.0,False,911.566206 
+443f9ee5-c3ad-4fa0-8725-22529aa36592,zai-org/GLM-4.5-Air-FP8,together_ai,dna-assembly,24705,21207,45912,644.52054,False,0.0,zai-org/GLM-4.5-Air-FP8,dna-assembly,644.52054,False,0.0,False,644.52054 +004b95f2-95d2-4346-98f1-65de9221a60b,openai/gpt-oss-120b,together_ai,video-processing,1891,1842,3733,62.642712,False,0.0,openai/gpt-oss-120b,video-processing,62.642712,False,0.0,False,62.642712 +ad13e37e-e085-4132-bbc2-427204da9faa,gpt-5,openai,git-leak-recovery,1878,1361,3239,208.594188,True,1.0,gpt-5,git-leak-recovery,208.594188,True,0.7142857142857143,True,208.594188 +2eb2a5c6-a060-4a4e-a0f4-42b8a04e8e2c,OpenAI/gpt-oss-20B,together_ai,fix-ocaml-gc,3865,13984,17849,587.239527,False,0.0,OpenAI/gpt-oss-20B,fix-ocaml-gc,587.239527,False,0.0,False,587.239527 +f002ec63-b254-4a29-91e2-ca2c8cc3ab11,gemini-2.5-pro,gemini,adaptive-rejection-sampler,8163,12656,20819,900.03646,False,0.0,gemini-2.5-pro,adaptive-rejection-sampler,900.03646,False,0.4,False,900.03646 +ba97c69f-8d65-406c-af0c-3628817ed782,gemini-2.5-flash,gemini,cobol-modernization,10822,10424,21246,933.830954,False,0.0,gemini-2.5-flash,cobol-modernization,933.830954,False,0.2,False,933.830954 +063e0a84-f376-4612-aa21-b3b3635d7220,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,wasm-pipeline,13405,9663,23068,819.460915,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,wasm-pipeline,819.460915,True,0.6,True,819.460915 +5734640c-6cbb-457d-b62d-8c4798eb87be,gemini-2.5-flash,gemini,log-summary-date-ranges,4812,3062,7874,171.118966,False,0.0,gemini-2.5-flash,log-summary-date-ranges,171.118966,False,0.0,False,171.118966 +e11be6ad-07a4-4552-8375-4a138ee7911e,claude-opus-4-1-20250805,anthropic,adaptive-rejection-sampler,10364,11486,21850,904.121964,False,0.0,claude-opus-4-1-20250805,adaptive-rejection-sampler,904.121964,False,0.125,False,904.121964 
+de14ffb1-1ad4-4839-8200-6e70b0f2ea84,gemini-2.5-flash,gemini,train-fasttext,15199,5372,20571,1332.157481,False,0.0,gemini-2.5-flash,train-fasttext,1332.157481,False,0.0,False,1332.157481 +f2602f60-a204-4ac5-8318-6a3af767cc98,gpt-5,openai,bn-fit-modify,3850,5052,8902,318.920008,False,0.0,gpt-5,bn-fit-modify,318.920008,False,0.5,False,318.920008 +6e59646a-cf75-4889-9f4e-8244174511ea,zai-org/GLM-4.5-Air-FP8,together_ai,reshard-c4-data,10595,4935,15530,310.582633,False,0.0,zai-org/GLM-4.5-Air-FP8,reshard-c4-data,310.582633,False,0.0,False,310.582633 +6bd0cc3b-f75f-41c9-b56f-f0253e395c8a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,filter-js-from-html,3248,1647,4895,81.386927,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,filter-js-from-html,81.386927,False,0.0,False,81.386927 +a0e28d61-75b6-4342-9394-261bbdeafce2,gemini-2.5-flash,gemini,fix-git,5210,2567,7777,190.960504,True,1.0,gemini-2.5-flash,fix-git,190.960504,True,0.8,True,190.960504 +1483dd49-f1e9-4678-ae57-58b5c745a2e6,gpt-5-mini,openai,pypi-server,2853,1564,4417,195.883431,True,1.0,gpt-5-mini,pypi-server,195.883431,True,0.8,True,195.883431 +1987feb4-4849-4179-abb2-cc106198eaf0,grok-4-0709,xai,merge-diff-arc-agi-task,7315,2026,9341,914.198965,False,0.0,grok-4-0709,merge-diff-arc-agi-task,914.198965,False,0.4,False,914.198965 +2b7ca9e1-3e0b-4255-8e8d-1d94ad09ef83,gpt-5-nano,openai,run-pdp11-code,6057,4903,10960,1037.246064,False,0.0,gpt-5-nano,run-pdp11-code,1037.246064,False,0.0,False,1037.246064 +518167f4-76d1-447b-b58f-cd76602fcfbb,openai/gpt-oss-120b,together_ai,bn-fit-modify,2439,1839,4278,194.462602,False,0.0,openai/gpt-oss-120b,bn-fit-modify,194.462602,False,0.2,False,194.462602 +e6da1840-fb0a-4ca6-b4d7-7d60410e7218,claude-opus-4-1-20250805,anthropic,crack-7z-hash,10567,3620,14187,685.795384,True,1.0,claude-opus-4-1-20250805,crack-7z-hash,685.795384,True,0.8888888888888888,True,685.795384 
+8f587f5d-0801-4f97-b4f9-19f5b112e74e,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,feal-differential-cryptanalysis,3285,3768,7053,303.201246,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,feal-differential-cryptanalysis,303.201246,False,0.0,False,303.201246 +161c701e-79d9-4b23-8d40-a22ee6984732,moonshotai/Kimi-K2-Instruct-0905,together_ai,large-scale-text-editing,7611,7951,15562,1245.096642,False,0.0,moonshotai/Kimi-K2-Instruct-0905,large-scale-text-editing,1245.096642,False,0.0,False,1245.096642 +8ffd70e1-c0a6-4b76-adf3-92848f6c5f9b,gemini-2.5-pro,gemini,distribution-search,1978,1975,3953,180.449652,False,0.0,gemini-2.5-pro,distribution-search,180.449652,False,0.6,False,180.449652 +fd2c08e5-c249-4ed7-ae2f-47315c6831c3,gemini-2.5-flash,gemini,distribution-search,21908,22743,44651,1122.881936,False,0.0,gemini-2.5-flash,distribution-search,1122.881936,False,0.0,False,1122.881936 +8eff9bc9-5442-46ca-a223-40ecf47af59a,claude-sonnet-4-20250514,anthropic,qemu-startup,7043,8385,15428,905.482006,False,0.0,claude-sonnet-4-20250514,qemu-startup,905.482006,False,0.4,False,905.482006 +84d96793-9bc5-402e-b454-bec71180bfd8,gpt-5-mini,openai,large-scale-text-editing,9007,5971,14978,1222.926937,False,0.0,gpt-5-mini,large-scale-text-editing,1222.926937,False,0.2,False,1222.926937 +16a1bfd6-e77b-4579-9d5e-9f0244a6b98e,claude-sonnet-4-20250514,anthropic,db-wal-recovery,4035,3953,7988,1024.431353,False,0.0,claude-sonnet-4-20250514,db-wal-recovery,1024.431353,False,0.0,False,1024.431353 +87bae500-5a3b-49dc-9328-e36c86f7d831,deepseek-ai/DeepSeek-V3.1,together_ai,extract-elf,6333,3023,9356,319.228374,True,1.0,deepseek-ai/DeepSeek-V3.1,extract-elf,319.228374,True,0.6,True,319.228374 +b78b8f96-a08c-456e-9b19-413560af85c0,gpt-5-mini,openai,fix-code-vulnerability,6585,3421,10006,952.186401,False,0.0,gpt-5-mini,fix-code-vulnerability,952.186401,False,0.0,False,952.186401 
+ebc0531f-b318-47c4-90c7-043b67485cc8,OpenAI/gpt-oss-20B,together_ai,prove-plus-comm,978,2340,3318,128.742029,False,0.0,OpenAI/gpt-oss-20B,prove-plus-comm,128.742029,False,0.0,False,128.742029 +3fd05fe6-3ed3-4822-ad45-07c328c4d8d7,claude-sonnet-4-20250514,anthropic,crack-7z-hash,8867,3410,12277,342.291987,True,1.0,claude-sonnet-4-20250514,crack-7z-hash,342.291987,True,1.0,True,342.291987 +493278cb-7d2b-41d7-89a3-6bbcc3368509,gemini-2.5-pro,gemini,large-scale-text-editing,3174,4457,7631,1242.73648,False,0.0,gemini-2.5-pro,large-scale-text-editing,1242.73648,False,0.4,False,1242.73648 +d1ea99a1-4b18-497e-beff-344f90191fc7,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,bn-fit-modify,15723,7110,22833,1137.643445,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,bn-fit-modify,1137.643445,False,0.0,False,1137.643445 +764759d3-7ece-48fe-8d61-3079e4adfb4d,gemini-2.5-pro,gemini,constraints-scheduling,3528,2461,5989,380.134874,True,1.0,gemini-2.5-pro,constraints-scheduling,380.134874,True,1.0,True,380.134874 +ab6108e2-5c89-4b49-a6bb-ab401aa260d6,claude-opus-4-1-20250805,anthropic,build-cython-ext,17048,5945,22993,391.65488,False,0.0,claude-opus-4-1-20250805,build-cython-ext,391.65488,False,0.0,False,391.65488 +f36374c1-4cc5-4fdd-83d8-b731374dedcd,gpt-5-nano,openai,break-filter-js-from-html,10814,11850,22664,1214.065029,False,0.0,gpt-5-nano,break-filter-js-from-html,1214.065029,False,0.0,False,1214.065029 +4c533f4a-105b-4c41-b46f-beb7acf237b4,claude-sonnet-4-20250514,anthropic,fix-code-vulnerability,20366,4137,24503,497.827049,True,1.0,claude-sonnet-4-20250514,fix-code-vulnerability,497.827049,True,0.8,True,497.827049 +9eae2eeb-837c-4e28-a30f-7b8e03c71fc3,gemini-2.5-flash,gemini,adaptive-rejection-sampler,10437,2975,13412,905.959331,False,0.0,gemini-2.5-flash,adaptive-rejection-sampler,905.959331,False,0.0,False,905.959331 
+2bc302ce-858c-469e-b020-a19d8072bc85,claude-opus-4-1-20250805,anthropic,git-leak-recovery,3025,1976,5001,230.848446,True,1.0,claude-opus-4-1-20250805,git-leak-recovery,230.848446,True,1.0,True,230.848446 +3d59670f-f03c-4de4-abb8-845522599496,gpt-5,openai,video-processing,6451,4310,10761,278.140621,False,0.0,gpt-5,video-processing,278.140621,False,0.0,False,278.140621 +faa263f1-85a8-4abe-8d2f-e2f6068fbd3d,gemini-2.5-flash,gemini,hf-model-inference,5285,1631,6916,153.094486,True,1.0,gemini-2.5-flash,hf-model-inference,153.094486,True,0.6,True,153.094486 +ecbbd069-5400-4116-b9ac-54260cc9fcd3,gpt-5-mini,openai,adaptive-rejection-sampler,6668,11888,18556,676.379444,True,1.0,gpt-5-mini,adaptive-rejection-sampler,676.379444,True,0.4,True,676.379444 +33a4bf0a-f6e5-4379-bde2-b971cbdf6317,zai-org/GLM-4.5-Air-FP8,together_ai,count-dataset-tokens,13019,3623,16642,920.351024,False,0.0,zai-org/GLM-4.5-Air-FP8,count-dataset-tokens,920.351024,False,0.0,False,920.351024 +9dbc4e35-7a0c-4fc8-97d6-752f323d4045,gpt-5-mini,openai,sqlite-db-truncate,3062,3877,6939,338.799654,False,0.0,gpt-5-mini,sqlite-db-truncate,338.799654,False,0.0,False,338.799654 +3e901893-2123-490c-899a-5eff7e3d63a5,OpenAI/gpt-oss-20B,together_ai,port-compressor,7169,24861,32030,3618.353702,False,0.0,OpenAI/gpt-oss-20B,port-compressor,3618.353702,False,0.0,False,3618.353702 +c0807dc8-ca09-4521-aefe-851e5f7b66ba,grok-4-0709,xai,bn-fit-modify,17530,7864,25394,3038.932611,True,1.0,grok-4-0709,bn-fit-modify,3038.932611,True,0.6,True,3038.932611 +ba2a9cc4-23bc-4476-886f-9e5fd5327577,gemini-2.5-flash,gemini,feal-differential-cryptanalysis,5049,33989,39038,431.355964,False,0.0,gemini-2.5-flash,feal-differential-cryptanalysis,431.355964,False,0.2,False,431.355964 +51e5b942-8cac-49cc-a3b4-de1d565c6078,grok-code-fast-1,xai,reshard-c4-data,1778,2883,4661,209.462943,False,0.0,grok-code-fast-1,reshard-c4-data,209.462943,False,0.0,False,209.462943 
+0e8eb221-0ed3-4301-b90e-7c14d7552466,claude-opus-4-1-20250805,anthropic,build-cython-ext,18489,5754,24243,355.528366,False,0.0,claude-opus-4-1-20250805,build-cython-ext,355.528366,False,0.0,False,355.528366 +5c2bd8d4-a671-4439-88ea-2938c391e038,claude-sonnet-4-20250514,anthropic,sqlite-db-truncate,5273,4152,9425,396.272263,False,0.0,claude-sonnet-4-20250514,sqlite-db-truncate,396.272263,False,0.0,False,396.272263 +bd7d739f-98b2-4161-b93d-da3aaf622bec,zai-org/GLM-4.5-Air-FP8,together_ai,dna-assembly,18889,9937,28826,531.922187,False,0.0,zai-org/GLM-4.5-Air-FP8,dna-assembly,531.922187,False,0.0,False,531.922187 +4196183f-9885-4780-91c0-5569a87cd7b3,gemini-2.5-pro,gemini,regex-log,1402,699,2101,109.631906,True,1.0,gemini-2.5-pro,regex-log,109.631906,True,0.8,True,109.631906 +11934b09-7fb4-4fb4-97d9-ded874403ba5,gemini-2.5-pro,gemini,large-scale-text-editing,1950,1166,3116,414.049017,True,1.0,gemini-2.5-pro,large-scale-text-editing,414.049017,True,0.4,True,414.049017 +e19214c7-11e0-4d3c-be5f-60e01bac3915,grok-4-0709,xai,wasm-pipeline,7841,2936,10777,510.127774,False,0.0,grok-4-0709,wasm-pipeline,510.127774,False,0.4,False,510.127774 +4b204004-32c6-4344-aa67-cb8b31b93f32,grok-4-0709,xai,vulnerable-secret,1821,1970,3791,901.390157,False,0.0,grok-4-0709,vulnerable-secret,901.390157,False,0.6,False,901.390157 +0e261ee6-9a2b-403e-9689-ee95fca29725,claude-opus-4-1-20250805,anthropic,fix-code-vulnerability,27866,14289,42155,645.203066,False,0.0,claude-opus-4-1-20250805,fix-code-vulnerability,645.203066,False,0.125,False,645.203066 +96af64fe-5703-4aa1-8d21-eaed8b288382,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sparql-university,7664,4693,12357,345.050973,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sparql-university,345.050973,False,0.0,False,345.050973 
+403e777c-5c65-4e6c-b11b-4f4baf37c48f,claude-opus-4-1-20250805,anthropic,torch-tensor-parallelism,2598,1811,4409,88.331873,False,0.0,claude-opus-4-1-20250805,torch-tensor-parallelism,88.331873,False,0.0,False,88.331873 +08aa8b62-6dfb-4abe-8dbb-a2e8d79d0bb9,claude-opus-4-1-20250805,anthropic,largest-eigenval,14258,11150,25408,901.361522,False,0.0,claude-opus-4-1-20250805,largest-eigenval,901.361522,False,0.25,False,901.361522 +7ec961ee-caa6-48d0-92af-a669881b3746,OpenAI/gpt-oss-20B,together_ai,mteb-leaderboard,936,229,1165,29.463283,False,0.0,OpenAI/gpt-oss-20B,mteb-leaderboard,29.463283,False,0.0,False,29.463283 +74dc8e27-bf5f-4947-bb54-3b618dcadb16,zai-org/GLM-4.5-Air-FP8,together_ai,path-tracing-reverse,48934,18613,67547,1585.560612,False,0.0,zai-org/GLM-4.5-Air-FP8,path-tracing-reverse,1585.560612,False,0.0,False,1585.560612 +91f654ec-4ff6-4ed0-9ae9-5ce504a14ad7,gpt-5,openai,feal-differential-cryptanalysis,3762,3595,7357,523.144905,False,0.0,gpt-5,feal-differential-cryptanalysis,523.144905,False,0.0,False,523.144905 +acbe80b2-aabe-4c09-aae7-6905c0c66816,moonshotai/Kimi-K2-Instruct-0905,together_ai,financial-document-processor,22122,7633,29755,538.449639,False,0.0,moonshotai/Kimi-K2-Instruct-0905,financial-document-processor,538.449639,False,0.0,False,538.449639 +8930e099-3045-4cb6-b040-0a8b467e92fb,gemini-2.5-pro,gemini,build-cython-ext,16263,5791,22054,596.690821,False,0.0,gemini-2.5-pro,build-cython-ext,596.690821,False,0.0,False,596.690821 +c3fdf7a2-5574-4425-a528-fbecb571513f,gpt-5-nano,openai,nginx-request-logging,5692,8030,13722,900.624736,False,0.0,gpt-5-nano,nginx-request-logging,900.624736,False,0.0,False,900.624736 +e4702c73-23fe-4201-82fe-620d5476ae24,gpt-5-nano,openai,model-extraction-relu-logits,3711,3168,6879,281.321433,False,0.0,gpt-5-nano,model-extraction-relu-logits,281.321433,False,0.0,False,281.321433 
+addd0bd5-a563-49f6-a282-6c99346f08d9,claude-opus-4-1-20250805,anthropic,regex-log,3396,2595,5991,368.250988,False,0.0,claude-opus-4-1-20250805,regex-log,368.250988,False,0.5714285714285714,False,368.250988 +c6d53bb7-5b70-4dfe-a7fe-cfb32ed99f50,zai-org/GLM-4.5-Air-FP8,together_ai,crack-7z-hash,16728,13238,29966,900.266514,False,0.0,zai-org/GLM-4.5-Air-FP8,crack-7z-hash,900.266514,False,0.0,False,900.266514 +123eeeab-4f1e-4f0a-8ee0-ef6f88a82f5f,openai/gpt-oss-120b,together_ai,make-doom-for-mips,13377,4876,18253,907.782117,False,0.0,openai/gpt-oss-120b,make-doom-for-mips,907.782117,False,0.0,False,907.782117 +24edb57e-b515-4450-817f-dbb41af0cf48,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,winning-avg-corewars,15408,17155,32563,2908.69855,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,winning-avg-corewars,2908.69855,False,0.0,False,2908.69855 +ca4e8210-a4ff-40b8-afbd-5516276e3eee,moonshotai/Kimi-K2-Instruct-0905,together_ai,port-compressor,68782,38314,107096,1299.824652,False,0.0,moonshotai/Kimi-K2-Instruct-0905,port-compressor,1299.824652,False,0.0,False,1299.824652 +f247293e-2088-4069-80d1-263a5dfec96a,claude-opus-4-1-20250805,anthropic,wasm-pipeline,7719,2635,10354,224.428482,False,0.0,claude-opus-4-1-20250805,wasm-pipeline,224.428482,False,0.1428571428571428,False,224.428482 +c886dc20-b62b-4425-94e2-f1486061badf,grok-code-fast-1,xai,code-from-image,7281,4843,12124,343.988905,False,0.0,grok-code-fast-1,code-from-image,343.988905,False,0.0,False,343.988905 +46d89796-e6d7-415e-b8d0-5f3f3d938aaf,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,filter-js-from-html,6095,2642,8737,611.113985,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,filter-js-from-html,611.113985,False,0.0,False,611.113985 +03c9965e-f232-4a99-9540-c9a41c6f9148,gpt-5-mini,openai,gpt2-codegolf,1485,1123,2608,124.154593,False,0.0,gpt-5-mini,gpt2-codegolf,124.154593,False,0.0,False,124.154593 
+54403f84-3b58-48c6-909c-010287f2e715,gpt-5-mini,openai,pytorch-model-cli,1852,1319,3171,124.677858,False,0.0,gpt-5-mini,pytorch-model-cli,124.677858,False,0.0,False,124.677858 +a0813987-5035-4d27-a162-59491d1d7e73,zai-org/GLM-4.5-Air-FP8,together_ai,sqlite-with-gcov,6665,2581,9246,168.923934,True,1.0,zai-org/GLM-4.5-Air-FP8,sqlite-with-gcov,168.923934,True,0.6,True,168.923934 +00090459-c21f-452f-a6e4-d5d5847522e8,moonshotai/Kimi-K2-Instruct-0905,together_ai,run-pdp11-code,10270,9022,19292,681.128358,False,0.0,moonshotai/Kimi-K2-Instruct-0905,run-pdp11-code,681.128358,False,0.0,False,681.128358 +862e23e7-1faa-46ce-9977-5ad58a44800e,claude-opus-4-1-20250805,anthropic,vulnerable-secret,4317,4451,8768,900.001458,False,0.0,claude-opus-4-1-20250805,vulnerable-secret,900.001458,False,0.625,False,900.001458 +458baed0-2b9d-4a50-97cf-f5c4261ce38e,gemini-2.5-flash,gemini,db-wal-recovery,2605,3892,6497,332.896125,False,0.0,gemini-2.5-flash,db-wal-recovery,332.896125,False,0.0,False,332.896125 +e6f23cad-9881-4526-9dd7-9b907bbe37fb,grok-code-fast-1,xai,make-doom-for-mips,12746,3756,16502,589.842526,False,0.0,grok-code-fast-1,make-doom-for-mips,589.842526,False,0.0,False,589.842526 +ef7c7d72-684c-42a7-a40f-1afbdbaab05d,OpenAI/gpt-oss-20B,together_ai,count-dataset-tokens,3301,8674,11975,902.607654,False,0.0,OpenAI/gpt-oss-20B,count-dataset-tokens,902.607654,False,0.0,False,902.607654 +fb6af8fe-c9b4-4a19-8989-26886ce467e2,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,chess-best-move,1934,2040,3974,78.995028,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,chess-best-move,78.995028,False,0.0,False,78.995028 +25aa4e25-852a-4e78-8936-a9ed8d107b26,zai-org/GLM-4.5-Air-FP8,together_ai,sqlite-with-gcov,11147,2893,14040,692.336752,True,1.0,zai-org/GLM-4.5-Air-FP8,sqlite-with-gcov,692.336752,True,0.6,True,692.336752 
+b11a9242-99d6-447c-ac66-423240bb92fc,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,mteb-leaderboard,2312,1570,3882,281.57408,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,mteb-leaderboard,281.57408,False,0.0,False,281.57408 +2b027ad8-265c-4035-ac8e-7715cd96bceb,deepseek-ai/DeepSeek-V3.1,together_ai,vulnerable-secret,7462,8771,16233,535.583917,False,0.0,deepseek-ai/DeepSeek-V3.1,vulnerable-secret,535.583917,False,0.4,False,535.583917 +1ebe098c-b6ab-4abd-bcc1-6963cb5f3af5,moonshotai/Kimi-K2-Instruct-0905,together_ai,video-processing,8894,6410,15304,388.241618,False,0.0,moonshotai/Kimi-K2-Instruct-0905,video-processing,388.241618,False,0.0,False,388.241618 +120fc17b-a4a6-44d3-8086-4ab7ff3a8508,OpenAI/gpt-oss-20B,together_ai,circuit-fibsqrt,1023,3352,4375,285.791206,False,0.0,OpenAI/gpt-oss-20B,circuit-fibsqrt,285.791206,False,0.0,False,285.791206 +05b61be6-aea8-4ff2-8c72-680cbb811d9b,claude-sonnet-4-20250514,anthropic,feal-differential-cryptanalysis,25242,24503,49745,1816.288025,False,0.0,claude-sonnet-4-20250514,feal-differential-cryptanalysis,1816.288025,False,0.0,False,1816.288025 +17474b49-b197-4cd7-ad39-1cfb51b5b867,gemini-2.5-flash,gemini,model-extraction-relu-logits,4960,6358,11318,900.415638,False,0.0,gemini-2.5-flash,model-extraction-relu-logits,900.415638,False,0.2,False,900.415638 +5a9b04fb-eba8-4f4b-a193-2c333963598c,gemini-2.5-pro,gemini,feal-differential-cryptanalysis,3120,2391,5511,496.416113,True,1.0,gemini-2.5-pro,feal-differential-cryptanalysis,496.416113,True,0.6,True,496.416113 +e5c89fd6-b828-4922-958c-6445b54e0699,gpt-5,openai,polyglot-rust-c,859,972,1831,938.261047,False,0.0,gpt-5,polyglot-rust-c,938.261047,False,0.0,False,938.261047 +c5821718-9037-426b-a94f-43df426362a8,openai/gpt-oss-120b,together_ai,form-filling,4582,3074,7656,68.063662,True,1.0,openai/gpt-oss-120b,form-filling,68.063662,True,0.6,True,68.063662 
+718c03e7-ba95-482f-a555-a8596b738b5c,openai/gpt-oss-120b,together_ai,prove-plus-comm,1366,822,2188,41.834069,True,1.0,openai/gpt-oss-120b,prove-plus-comm,41.834069,True,1.0,True,41.834069 +0ff3f69b-56b5-454c-994e-edbbedef3979,claude-sonnet-4-20250514,anthropic,model-extraction-relu-logits,8774,6551,15325,368.724788,False,0.0,claude-sonnet-4-20250514,model-extraction-relu-logits,368.724788,False,0.0,False,368.724788 +f4299ba2-0bce-4100-8ec2-e682b85c30a2,gpt-5-nano,openai,vulnerable-secret,3385,2961,6346,924.125589,False,0.0,gpt-5-nano,vulnerable-secret,924.125589,False,0.2,False,924.125589 +540275ce-c236-41ad-bd36-1aff908fa555,zai-org/GLM-4.5-Air-FP8,together_ai,dna-insert,2942,3747,6689,379.011423,False,0.0,zai-org/GLM-4.5-Air-FP8,dna-insert,379.011423,False,0.0,False,379.011423 +1bde948b-4128-4100-9baf-08bdc84b8be2,gemini-2.5-flash,gemini,make-doom-for-mips,14200,6508,20708,910.993634,False,0.0,gemini-2.5-flash,make-doom-for-mips,910.993634,False,0.0,False,910.993634 +50cb1a63-0aa0-4785-ae16-d365d5db67e6,gpt-5-mini,openai,build-cython-ext,6727,2750,9477,940.840837,False,0.0,gpt-5-mini,build-cython-ext,940.840837,False,0.2,False,940.840837 +a648dfae-38b0-446d-88c0-ff179e335af1,zai-org/GLM-4.5-Air-FP8,together_ai,largest-eigenval,10082,9062,19144,900.375306,False,0.0,zai-org/GLM-4.5-Air-FP8,largest-eigenval,900.375306,False,0.0,False,900.375306 +b3550fce-5075-475f-8e97-3c1f16b8db77,claude-opus-4-1-20250805,anthropic,gpt2-codegolf,1232,2008,3240,1018.917097,False,0.0,claude-opus-4-1-20250805,gpt2-codegolf,1018.917097,False,0.0,False,1018.917097 +cc51af98-1dce-45a1-8249-d05c8445e2f6,moonshotai/Kimi-K2-Instruct-0905,together_ai,financial-document-processor,21218,15465,36683,1175.052338,False,0.0,moonshotai/Kimi-K2-Instruct-0905,financial-document-processor,1175.052338,False,0.0,False,1175.052338 
+c1b78f68-50ac-470a-82f1-468534ae49bd,moonshotai/Kimi-K2-Instruct-0905,together_ai,tune-mjcf,9745,10247,19992,904.245024,False,0.0,moonshotai/Kimi-K2-Instruct-0905,tune-mjcf,904.245024,False,0.4,False,904.245024 +571e0561-859a-44d1-8f66-9f99bd3c0cf3,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,cobol-modernization,15366,11284,26650,835.953787,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,cobol-modernization,835.953787,False,0.0,False,835.953787 +1254d544-f93a-4598-a42a-ced14dbcab43,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,regex-log,1365,809,2174,625.376828,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,regex-log,625.376828,False,0.0,False,625.376828 +53384d0b-c0fe-455d-aec6-0dccdcf3516b,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,polyglot-c-py,5819,2879,8698,276.795469,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,polyglot-c-py,276.795469,False,0.0,False,276.795469 +7834d5ab-94f9-4788-86ae-8f87782982cc,claude-opus-4-1-20250805,anthropic,pytorch-model-cli,6693,5069,11762,494.763512,False,0.0,claude-opus-4-1-20250805,pytorch-model-cli,494.763512,False,0.4285714285714285,False,494.763512 +781c84a8-c6da-41b7-9e61-50c700a288ba,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,financial-document-processor,11831,5182,17013,890.061216,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,financial-document-processor,890.061216,False,0.0,False,890.061216 +0d0bb73f-14e6-46c7-bd37-aefdad3d17ab,gpt-5-mini,openai,largest-eigenval,13011,14085,27096,900.195707,False,0.0,gpt-5-mini,largest-eigenval,900.195707,False,0.0,False,900.195707 +b8945bb2-965f-41c1-a835-4b2f25e4a9c8,moonshotai/Kimi-K2-Instruct-0905,together_ai,polyglot-rust-c,8570,10477,19047,900.006148,False,0.0,moonshotai/Kimi-K2-Instruct-0905,polyglot-rust-c,900.006148,False,0.0,False,900.006148 
+f79ce026-eb9b-4345-8080-0e7dacc9bffb,gpt-5-mini,openai,run-pdp11-code,2429,1331,3760,222.067762,False,0.0,gpt-5-mini,run-pdp11-code,222.067762,False,0.0,False,222.067762 +079e5015-34b3-4245-96a2-9b06d49fb7af,claude-opus-4-1-20250805,anthropic,nginx-request-logging,5097,2368,7465,129.801722,True,1.0,claude-opus-4-1-20250805,nginx-request-logging,129.801722,True,1.0,True,129.801722 +875fe2f9-879b-49d3-aea9-9a875ea7c4d5,gemini-2.5-pro,gemini,merge-diff-arc-agi-task,8488,2796,11284,301.771479,True,1.0,gemini-2.5-pro,merge-diff-arc-agi-task,301.771479,True,0.6,True,301.771479 +1f8d1ebd-1a70-4a76-ab8a-53c91ac2ad7f,gemini-2.5-flash,gemini,distribution-search,11209,38516,49725,3600.560965,False,0.0,gemini-2.5-flash,distribution-search,3600.560965,False,0.0,False,3600.560965 +a5b643b9-76f1-455a-855f-fa5f5f06da6c,grok-code-fast-1,xai,winning-avg-corewars,9812,6597,16409,1438.55769,False,0.0,grok-code-fast-1,winning-avg-corewars,1438.55769,False,0.0,False,1438.55769 +0c0f13f4-ec56-40ca-bbcb-20b0cc7c6bc9,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,hf-model-inference,4509,1983,6492,925.986945,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,hf-model-inference,925.986945,False,0.0,False,925.986945 +d4c39c15-85d3-49f1-8f42-ee7522eaef00,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,dna-insert,2978,2063,5041,373.498096,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,dna-insert,373.498096,False,0.0,False,373.498096 +d9eca115-e0c3-463d-98b2-a9dc24bf7b3f,openai/gpt-oss-120b,together_ai,build-cython-ext,6544,2540,9084,900.472911,False,0.0,openai/gpt-oss-120b,build-cython-ext,900.472911,False,0.0,False,900.472911 +a952debc-fabe-4421-9ef7-053739177604,grok-code-fast-1,xai,distribution-search,2415,1376,3791,267.021554,False,0.0,grok-code-fast-1,distribution-search,267.021554,False,0.0,False,267.021554 
+415e363c-8a81-4ce3-98a9-52cd0be7d093,moonshotai/Kimi-K2-Instruct-0905,together_ai,regex-log,4334,3035,7369,272.557405,False,0.0,moonshotai/Kimi-K2-Instruct-0905,regex-log,272.557405,False,0.4,False,272.557405 +1b927bd5-a0d3-4364-b630-1f7e80fd9e28,OpenAI/gpt-oss-20B,together_ai,large-scale-text-editing,5354,15476,20830,1238.868658,False,0.0,OpenAI/gpt-oss-20B,large-scale-text-editing,1238.868658,False,0.0,False,1238.868658 +4becdaf2-ded7-4b93-b3d1-2a0197f8e31a,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,dna-insert,5411,893,6304,374.011014,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,dna-insert,374.011014,False,0.0,False,374.011014 +d69ca7d1-2fd8-4f4e-95d1-6a1c66bf68fe,claude-opus-4-1-20250805,anthropic,crack-7z-hash,15457,4872,20329,581.434339,True,1.0,claude-opus-4-1-20250805,crack-7z-hash,581.434339,True,0.8888888888888888,True,581.434339 +13b4dd5d-b1f8-4e05-9fb3-6163378efb24,moonshotai/Kimi-K2-Instruct-0905,together_ai,qemu-startup,1734,1989,3723,224.649714,False,0.0,moonshotai/Kimi-K2-Instruct-0905,qemu-startup,224.649714,False,0.4,False,224.649714 +fa031b00-8bc5-42f2-af84-2cdd01663a9a,moonshotai/Kimi-K2-Instruct-0905,together_ai,prove-plus-comm,2121,1624,3745,394.415537,True,1.0,moonshotai/Kimi-K2-Instruct-0905,prove-plus-comm,394.415537,True,0.8,True,394.415537 +92af63b5-7b45-41cb-b64d-f5d2ce424461,openai/gpt-oss-120b,together_ai,dna-insert,18836,10812,29648,373.07906,False,0.0,openai/gpt-oss-120b,dna-insert,373.07906,False,0.0,False,373.07906 +bae9db50-5600-4448-aea3-91ab014cbe7e,gpt-5-mini,openai,wasm-pipeline,10973,8026,18999,318.65126,True,1.0,gpt-5-mini,wasm-pipeline,318.65126,True,0.6,True,318.65126 +f668dff4-7763-4ed2-82d4-6ba8e462bf1e,deepseek-ai/DeepSeek-V3.1,together_ai,constraints-scheduling,4923,2867,7790,253.174731,False,0.0,deepseek-ai/DeepSeek-V3.1,constraints-scheduling,253.174731,False,0.8,False,253.174731 
+4f5b7a2a-8051-4fcd-bb1d-ba1bd243b33c,gemini-2.5-pro,gemini,cancel-async-tasks,1110,562,1672,72.256043,False,0.0,gemini-2.5-pro,cancel-async-tasks,72.256043,False,0.0,False,72.256043 +18cefb64-eb87-4470-a1f6-a728fd04db81,gpt-5-mini,openai,fix-git,3811,1604,5415,151.432391,False,0.0,gpt-5-mini,fix-git,151.432391,False,0.6,False,151.432391 +474e9c2c-4df7-4ce5-b8bf-3d529dd73476,zai-org/GLM-4.5-Air-FP8,together_ai,password-recovery,2858,6866,9724,902.199165,False,0.0,zai-org/GLM-4.5-Air-FP8,password-recovery,902.199165,False,0.0,False,902.199165 +867a3f48-f7ac-46ce-90ee-e8b99b9108a3,deepseek-ai/DeepSeek-V3.1,together_ai,prove-plus-comm,2230,1668,3898,158.454283,True,1.0,deepseek-ai/DeepSeek-V3.1,prove-plus-comm,158.454283,True,1.0,True,158.454283 +e8de320d-ce85-4649-b046-e500b7fe7cfc,claude-sonnet-4-20250514,anthropic,dna-assembly,11836,7791,19627,748.965164,False,0.0,claude-sonnet-4-20250514,dna-assembly,748.965164,False,0.0,False,748.965164 +b64ff970-4482-46ec-8071-b241fa3ac2dc,openai/gpt-oss-120b,together_ai,polyglot-rust-c,543,871,1414,141.29147,False,0.0,openai/gpt-oss-120b,polyglot-rust-c,141.29147,False,0.0,False,141.29147 +4d5ff12b-68ee-44cb-81a9-dbed85895112,grok-4-0709,xai,sqlite-with-gcov,9829,1606,11435,482.71818,False,0.0,grok-4-0709,sqlite-with-gcov,482.71818,False,0.0,False,482.71818 +3efe6916-87ec-4504-a41f-579d3ef31013,claude-opus-4-1-20250805,anthropic,git-leak-recovery,2304,1599,3903,80.871534,True,1.0,claude-opus-4-1-20250805,git-leak-recovery,80.871534,True,1.0,True,80.871534 +0b5bdcac-a289-43e1-a0c2-d67b6c50d789,openai/gpt-oss-120b,together_ai,build-pmars,5638,3154,8792,915.518592,False,0.0,openai/gpt-oss-120b,build-pmars,915.518592,False,0.2,False,915.518592 +4c299126-2de4-4b35-9483-008d62c86533,gpt-5,openai,qemu-startup,2435,2867,5302,920.1992,False,0.0,gpt-5,qemu-startup,920.1992,False,0.8,False,920.1992 
+74f22536-99cd-4868-a42f-729d38d9557a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,port-compressor,75384,26885,102269,3600.006561,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,port-compressor,3600.006561,False,0.0,False,3600.006561 +aac3df65-1bf8-4494-82b7-f5f75aee8695,gpt-5-nano,openai,financial-document-processor,26724,19215,45939,1200.108211,False,0.0,gpt-5-nano,financial-document-processor,1200.108211,False,0.0,False,1200.108211 +2c1a6033-8906-48c7-9701-78aa1714f30a,grok-code-fast-1,xai,feal-linear-cryptanalysis,13513,9376,22889,777.650423,False,0.0,grok-code-fast-1,feal-linear-cryptanalysis,777.650423,False,0.0,False,777.650423 +0dd6db81-a42f-4608-892d-64d3c445067f,claude-sonnet-4-20250514,anthropic,mteb-leaderboard,1137,880,2017,60.790112,False,0.0,claude-sonnet-4-20250514,mteb-leaderboard,60.790112,False,0.0,False,60.790112 +e254e52e-f245-4916-9fe4-c0fe15f0a6c1,gemini-2.5-flash,gemini,polyglot-rust-c,1204,4876,6080,900.939822,False,0.0,gemini-2.5-flash,polyglot-rust-c,900.939822,False,0.0,False,900.939822 +9081549d-9bef-4a44-b0fe-f5e760f1e4cb,claude-opus-4-1-20250805,anthropic,feal-linear-cryptanalysis,24319,24973,49292,1800.509458,False,0.0,claude-opus-4-1-20250805,feal-linear-cryptanalysis,1800.509458,False,0.0,False,1800.509458 +12fd4ea7-602b-454c-a88f-0d59b7a7c358,zai-org/GLM-4.5-Air-FP8,together_ai,polyglot-rust-c,19817,26671,46488,900.103093,False,0.0,zai-org/GLM-4.5-Air-FP8,polyglot-rust-c,900.103093,False,0.0,False,900.103093 +9c192dbc-56df-4298-91be-9eb1866eebd6,claude-sonnet-4-20250514,anthropic,chess-best-move,7075,7396,14471,765.37166,False,0.0,claude-sonnet-4-20250514,chess-best-move,765.37166,False,0.0,False,765.37166 +deb156e6-22a8-48cc-a753-bef7546cf845,zai-org/GLM-4.5-Air-FP8,together_ai,feal-differential-cryptanalysis,13678,12248,25926,799.657608,False,0.0,zai-org/GLM-4.5-Air-FP8,feal-differential-cryptanalysis,799.657608,False,0.0,False,799.657608 
+a2443d3a-6a5f-47ab-bfd9-871ed26d94f5,gemini-2.5-pro,gemini,large-scale-text-editing,1780,1022,2802,238.957385,True,1.0,gemini-2.5-pro,large-scale-text-editing,238.957385,True,0.4,True,238.957385 +163b20ee-9fc2-45b5-8aae-a3624e1837f0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,constraints-scheduling,13629,13286,26915,702.942225,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,constraints-scheduling,702.942225,True,1.0,True,702.942225 +7c3f8538-4107-41eb-925b-c9bccea0e5a2,gpt-5-nano,openai,feal-linear-cryptanalysis,29327,31161,60488,1800.110598,False,0.0,gpt-5-nano,feal-linear-cryptanalysis,1800.110598,False,0.0,False,1800.110598 +4d787dea-0d61-4670-bdaa-ae25753d3785,moonshotai/Kimi-K2-Instruct-0905,together_ai,feal-linear-cryptanalysis,12250,16598,28848,1805.750966,False,0.0,moonshotai/Kimi-K2-Instruct-0905,feal-linear-cryptanalysis,1805.750966,False,0.0,False,1805.750966 +f2032e58-77e6-40c7-95f0-2a63dbfe0eb2,gpt-5-nano,openai,sparql-university,14488,10097,24585,907.096685,False,0.0,gpt-5-nano,sparql-university,907.096685,False,0.0,False,907.096685 +f7208ee3-1cda-4070-892d-204c5b8d6e3c,OpenAI/gpt-oss-20B,together_ai,largest-eigenval,651,2904,3555,210.989092,False,0.0,OpenAI/gpt-oss-20B,largest-eigenval,210.989092,False,0.0,False,210.989092 +0bad16b2-12e7-4559-8263-1f5a1bb08fce,gpt-5-nano,openai,adaptive-rejection-sampler,5019,3186,8205,332.455199,False,0.0,gpt-5-nano,adaptive-rejection-sampler,332.455199,False,0.2,False,332.455199 +94437be0-6127-4e60-9d04-0ab1ce858c18,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,polyglot-c-py,19605,17115,36720,900.017569,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,polyglot-c-py,900.017569,False,0.0,False,900.017569 +00a6522b-53a9-4afd-ab14-5ac298d3ed7d,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-pov-ray,27806,8000,35806,3105.266429,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-pov-ray,3105.266429,False,0.2,False,3105.266429 
+e31f7c5b-fcf2-4b90-925a-60b2ddce2a18,gpt-5,openai,run-pdp11-code,5430,4873,10303,534.175527,False,0.0,gpt-5,run-pdp11-code,534.175527,False,0.0,False,534.175527 +0bd10e96-f7cb-4d56-b1e7-6453483922a1,gemini-2.5-pro,gemini,feal-linear-cryptanalysis,14767,22820,37587,1802.292989,False,0.0,gemini-2.5-pro,feal-linear-cryptanalysis,1802.292989,False,0.0,False,1802.292989 +a0e2fc2b-6448-43c3-a8c4-20d68f9401ae,openai/gpt-oss-120b,together_ai,hf-model-inference,3426,1024,4450,112.271213,False,0.0,openai/gpt-oss-120b,hf-model-inference,112.271213,False,0.0,False,112.271213 +3b8a6da2-13c5-4ab8-be7b-bbbf279aeae4,claude-opus-4-1-20250805,anthropic,train-fasttext,31781,12716,44497,3646.901448,False,0.0,claude-opus-4-1-20250805,train-fasttext,3646.901448,False,0.2857142857142857,False,3646.901448 +4133e8c0-bf92-4b53-9436-3ddec9417aad,claude-opus-4-1-20250805,anthropic,gpt2-codegolf,11547,11803,23350,900.149939,False,0.0,claude-opus-4-1-20250805,gpt2-codegolf,900.149939,False,0.0,False,900.149939 +9c1fbb70-5c2d-401b-bc44-a2b25e744687,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,gpt2-codegolf,8036,7247,15283,384.661556,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,gpt2-codegolf,384.661556,False,0.0,False,384.661556 +edee0c76-d82a-46ae-957f-c8308f041175,claude-opus-4-1-20250805,anthropic,path-tracing,31794,22745,54539,1859.136666,False,0.0,claude-opus-4-1-20250805,path-tracing,1859.136666,False,0.0,False,1859.136666 +86ea8d23-553c-4389-8d31-94f5fcac083e,zai-org/GLM-4.5-Air-FP8,together_ai,large-scale-text-editing,13852,10038,23890,1211.805926,False,0.0,zai-org/GLM-4.5-Air-FP8,large-scale-text-editing,1211.805926,False,0.0,False,1211.805926 +35b5fddf-7745-455a-a57a-503f7f61e8f1,gpt-5-nano,openai,filter-js-from-html,1520,1028,2548,123.623545,False,0.0,gpt-5-nano,filter-js-from-html,123.623545,False,0.0,False,123.623545 
+638fa9f7-fd43-4f40-a0a9-222a248993db,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,merge-diff-arc-agi-task,23401,11133,34534,900.460495,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,merge-diff-arc-agi-task,900.460495,False,0.0,False,900.460495 +0952b483-f724-4859-954f-ee6ab4bfad53,openai/gpt-oss-120b,together_ai,configure-git-webserver,6395,2141,8536,295.40014,True,1.0,openai/gpt-oss-120b,configure-git-webserver,295.40014,True,0.6,True,295.40014 +3fb77c08-0ac4-45f4-9067-0f4e658855f3,deepseek-ai/DeepSeek-V3.1,together_ai,schemelike-metacircular-eval,26609,26709,53318,2407.670819,False,0.0,deepseek-ai/DeepSeek-V3.1,schemelike-metacircular-eval,2407.670819,False,0.0,False,2407.670819 +f1f9f9b3-6288-4fa2-bc31-945f240193f3,openai/gpt-oss-120b,together_ai,feal-linear-cryptanalysis,8734,21148,29882,1800.858603,False,0.0,openai/gpt-oss-120b,feal-linear-cryptanalysis,1800.858603,False,0.4,False,1800.858603 +55f63ef5-dfcf-4386-9686-5be567cf5f32,moonshotai/Kimi-K2-Instruct-0905,together_ai,make-doom-for-mips,18779,6281,25060,907.866592,False,0.0,moonshotai/Kimi-K2-Instruct-0905,make-doom-for-mips,907.866592,False,0.0,False,907.866592 +1c2a993b-c6b6-4ea1-bbd8-166d05ac01c3,gemini-2.5-pro,gemini,model-extraction-relu-logits,2237,1957,4194,229.467774,False,0.0,gemini-2.5-pro,model-extraction-relu-logits,229.467774,False,0.0,False,229.467774 +03ba89f0-1269-4708-a57f-2b6881a16b5b,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-cython-ext,20338,5285,25623,901.228377,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-cython-ext,901.228377,False,0.0,False,901.228377 +cf934e81-c8ea-43fb-bc7d-79b384b90e57,zai-org/GLM-4.5-Air-FP8,together_ai,prove-plus-comm,10162,13400,23562,912.975059,False,0.0,zai-org/GLM-4.5-Air-FP8,prove-plus-comm,912.975059,False,0.8,False,912.975059 
+1ecbe457-d3d2-45cd-91e3-7b2a8b3b576d,deepseek-ai/DeepSeek-V3.1,together_ai,mteb-retrieve,3038,1320,4358,185.611729,False,0.0,deepseek-ai/DeepSeek-V3.1,mteb-retrieve,185.611729,False,0.0,False,185.611729 +5642bbdb-5db2-4b69-b0d0-15460143bda9,gpt-5-nano,openai,hf-model-inference,8962,5737,14699,355.19306,True,1.0,gpt-5-nano,hf-model-inference,355.19306,True,0.4,True,355.19306 +021f04d4-4b5a-4be4-9059-ed79174016fc,openai/gpt-oss-120b,together_ai,run-pdp11-code,4316,2961,7277,202.563766,False,0.0,openai/gpt-oss-120b,run-pdp11-code,202.563766,False,0.0,False,202.563766 +e7a28c2d-e4a6-4bba-afad-04134ea4b4e5,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,hf-model-inference,3325,2309,5634,102.926319,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,hf-model-inference,102.926319,True,0.8,True,102.926319 +b8c6dc20-6abe-424a-9e90-9c479900ef23,grok-code-fast-1,xai,reshard-c4-data,5009,3324,8333,228.425349,False,0.0,grok-code-fast-1,reshard-c4-data,228.425349,False,0.0,False,228.425349 +7412edec-d8f6-4226-9342-f5053ebcb1a4,zai-org/GLM-4.5-Air-FP8,together_ai,wasm-pipeline,3239,3996,7235,124.992499,False,0.0,zai-org/GLM-4.5-Air-FP8,wasm-pipeline,124.992499,False,0.2,False,124.992499 +1f9dd107-1318-4a1d-8898-c40995b6d292,OpenAI/gpt-oss-20B,together_ai,reshard-c4-data,2441,2908,5349,125.623363,False,0.0,OpenAI/gpt-oss-20B,reshard-c4-data,125.623363,False,0.0,False,125.623363 +6214e46a-4b19-4ce0-8fe2-9c7fa20366ca,gemini-2.5-flash,gemini,fix-git,2888,1969,4857,120.301791,True,1.0,gemini-2.5-flash,fix-git,120.301791,True,0.8,True,120.301791 +7f85acbc-0f96-41c0-bbd7-1c79c3bdef0e,grok-code-fast-1,xai,pypi-server,4035,1972,6007,358.658308,True,1.0,grok-code-fast-1,pypi-server,358.658308,True,0.8,True,358.658308 +6c714c28-5c82-47fc-887b-1d7a48ebc385,gpt-5-mini,openai,video-processing,3272,3233,6505,251.469578,False,0.0,gpt-5-mini,video-processing,251.469578,False,0.0,False,251.469578 
+654f15a3-eb15-4b57-a050-e1d6eef6129e,gpt-5-mini,openai,extract-elf,2404,3443,5847,210.088688,True,1.0,gpt-5-mini,extract-elf,210.088688,True,0.6,True,210.088688 +e9a5541d-2044-482b-8a7d-30debd7e6eba,grok-4-0709,xai,build-cython-ext,13133,6122,19255,904.099153,False,0.0,grok-4-0709,build-cython-ext,904.099153,False,0.0,False,904.099153 +33f71961-78c3-4225-a260-731a037cb298,moonshotai/Kimi-K2-Instruct-0905,together_ai,reverse-engineering,23522,20988,44510,1811.558149,False,0.0,moonshotai/Kimi-K2-Instruct-0905,reverse-engineering,1811.558149,False,0.2,False,1811.558149 +9567cfd5-d7bf-489d-a188-251650d35caf,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,hf-model-inference,7036,3211,10247,342.102901,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,hf-model-inference,342.102901,False,0.0,False,342.102901 +01abbe71-2473-4587-bb75-bfe815f7ab5d,claude-opus-4-1-20250805,anthropic,torch-tensor-parallelism,2302,1697,3999,50.283946,False,0.0,claude-opus-4-1-20250805,torch-tensor-parallelism,50.283946,False,0.0,False,50.283946 +81fbbbc2-d765-42f2-8f1b-3c0f6f238e0a,grok-4-0709,xai,distribution-search,1181,1665,2846,439.210163,False,0.0,grok-4-0709,distribution-search,439.210163,False,0.4,False,439.210163 +201e3378-70f0-4bef-b329-73601ef2bc7d,gpt-5,openai,write-compressor,1953,2496,4449,906.284959,False,0.0,gpt-5,write-compressor,906.284959,False,0.3333333333333333,False,906.284959 +63ac2895-a7c5-483d-a577-165dc14fb79f,grok-code-fast-1,xai,cancel-async-tasks,1114,949,2063,165.10426,False,0.0,grok-code-fast-1,cancel-async-tasks,165.10426,False,0.2,False,165.10426 +c200ee65-6142-4bae-9d20-bea5f910505b,OpenAI/gpt-oss-20B,together_ai,dna-insert,1272,1414,2686,372.228474,False,0.0,OpenAI/gpt-oss-20B,dna-insert,372.228474,False,0.0,False,372.228474 +4ad19b08-5854-4974-bbe5-64e5328a55d8,OpenAI/gpt-oss-20B,together_ai,configure-git-webserver,873,1307,2180,149.752211,False,0.0,OpenAI/gpt-oss-20B,configure-git-webserver,149.752211,False,0.2,False,149.752211 
+f1890747-ce51-4666-9ff1-658eeb017b38,grok-4-0709,xai,constraints-scheduling,4592,3913,8505,1202.244716,False,0.0,grok-4-0709,constraints-scheduling,1202.244716,False,0.8,False,1202.244716 +f8e30418-bb33-495b-a1e3-a44906c15318,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,distribution-search,19687,11754,31441,3600.129881,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,distribution-search,3600.129881,False,0.0,False,3600.129881 +a0d29ae7-835f-4fb4-8de4-076a8d10dba3,zai-org/GLM-4.5-Air-FP8,together_ai,configure-git-webserver,2452,3856,6308,300.760405,False,0.0,zai-org/GLM-4.5-Air-FP8,configure-git-webserver,300.760405,False,0.0,False,300.760405 +e7375bf0-2717-40e4-a96f-fda52d20e679,gpt-5-nano,openai,pytorch-model-recovery,7114,10874,17988,909.594941,False,0.0,gpt-5-nano,pytorch-model-recovery,909.594941,False,0.0,False,909.594941 +6cedb864-dfdd-4b8c-8c2b-f133a68c9811,gpt-5-mini,openai,circuit-fibsqrt,34027,57487,91514,3605.65617,False,0.0,gpt-5-mini,circuit-fibsqrt,3605.65617,False,0.0,False,3605.65617 +8ebd1b27-ddc6-4609-9260-53052f563d16,gpt-5-mini,openai,git-leak-recovery,4272,3900,8172,994.094624,False,0.0,gpt-5-mini,git-leak-recovery,994.094624,False,0.0,False,994.094624 +8629563b-b5c9-4598-8c11-351a55eea5e5,gemini-2.5-pro,gemini,video-processing,3030,2742,5772,168.156932,False,0.0,gemini-2.5-pro,video-processing,168.156932,False,0.0,False,168.156932 +61155f11-74de-4682-b4a8-60fb74609b47,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,pytorch-model-recovery,18685,9306,27991,644.098194,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,pytorch-model-recovery,644.098194,False,0.0,False,644.098194 +1a528372-4f54-40e6-92f3-b4f8f5db7fa7,claude-sonnet-4-20250514,anthropic,mteb-retrieve,2637,1841,4478,326.787733,False,0.0,claude-sonnet-4-20250514,mteb-retrieve,326.787733,False,0.0,False,326.787733 
+967648d1-efad-453d-80f4-7bc2233b80ec,gpt-5-mini,openai,build-pmars,4215,4185,8400,903.912323,False,0.0,gpt-5-mini,build-pmars,903.912323,False,0.2,False,903.912323 +46146ca3-5f7a-4caa-bb8d-47b4c5c578e9,gpt-5-nano,openai,openssl-selfsigned-cert,5119,4987,10106,292.403505,True,1.0,gpt-5-nano,openssl-selfsigned-cert,292.403505,True,0.6,True,292.403505 +dc7b00c1-2147-4661-80c8-e69303f139c9,gpt-5-nano,openai,polyglot-c-py,7709,6482,14191,595.425073,False,0.0,gpt-5-nano,polyglot-c-py,595.425073,False,0.0,False,595.425073 +90e9dde5-ba53-40b8-9429-5899f7cff37b,grok-code-fast-1,xai,dna-assembly,6519,1782,8301,197.337656,False,0.0,grok-code-fast-1,dna-assembly,197.337656,False,0.0,False,197.337656 +225cdc57-9105-4e38-a05c-d0fc666c5d48,claude-opus-4-1-20250805,anthropic,pypi-server,5368,2363,7731,245.695786,True,1.0,claude-opus-4-1-20250805,pypi-server,245.695786,True,1.0,True,245.695786 +bdfa877a-433c-4afb-a33b-ce1d239fc818,gpt-5-mini,openai,qemu-alpine-ssh,4867,5969,10836,900.116404,False,0.0,gpt-5-mini,qemu-alpine-ssh,900.116404,False,0.0,False,900.116404 +1a05eaf9-8fa0-456c-8ccc-111218efa518,OpenAI/gpt-oss-20B,together_ai,tune-mjcf,953,2922,3875,129.569055,False,0.0,OpenAI/gpt-oss-20B,tune-mjcf,129.569055,False,0.0,False,129.569055 +d6ee15ac-03ea-4629-b73d-e7bc053282c9,gpt-5,openai,openssl-selfsigned-cert,1993,1288,3281,94.043205,True,1.0,gpt-5,openssl-selfsigned-cert,94.043205,True,1.0,True,94.043205 +55410dd9-1fd8-4661-8e32-d09b7948300d,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sparql-university,2319,2196,4515,929.961259,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sparql-university,929.961259,False,0.0,False,929.961259 +e4a7bb49-11fd-484b-a315-3def68640f46,openai/gpt-oss-120b,together_ai,polyglot-rust-c,2096,10721,12817,906.844519,False,0.0,openai/gpt-oss-120b,polyglot-rust-c,906.844519,False,0.0,False,906.844519 
+45ef3e22-0c00-4e15-8cb7-174143623546,claude-sonnet-4-20250514,anthropic,sanitize-git-repo,11245,3697,14942,906.840565,False,0.0,claude-sonnet-4-20250514,sanitize-git-repo,906.840565,False,0.0,False,906.840565 +f8d8f335-00ed-461d-bac5-fdad6d3d6857,deepseek-ai/DeepSeek-V3.1,together_ai,form-filling,6116,4288,10404,207.304221,True,1.0,deepseek-ai/DeepSeek-V3.1,form-filling,207.304221,True,0.8,True,207.304221 +889967a4-8c41-482a-8daf-f679f80b049c,claude-sonnet-4-20250514,anthropic,password-recovery,3765,4923,8688,864.163425,True,1.0,claude-sonnet-4-20250514,password-recovery,864.163425,True,0.4,True,864.163425 +353f49dd-306d-4e36-9cd3-4f420cec1a14,OpenAI/gpt-oss-20B,together_ai,train-fasttext,912,2046,2958,267.011545,False,0.0,OpenAI/gpt-oss-20B,train-fasttext,267.011545,False,0.0,False,267.011545 +06265101-16a5-4857-9202-ecf3934fec1e,gemini-2.5-flash,gemini,nginx-request-logging,7585,15621,23206,900.089541,False,0.0,gemini-2.5-flash,nginx-request-logging,900.089541,False,0.0,False,900.089541 +313343a4-9165-4387-9b77-41bd26100869,gpt-5,openai,sanitize-git-repo,15261,4103,19364,350.852476,True,1.0,gpt-5,sanitize-git-repo,350.852476,True,0.2857142857142857,True,350.852476 +a0124f49-0031-49e3-8ba6-19596f24831c,gemini-2.5-pro,gemini,make-mips-interpreter,31200,56939,88139,1813.991046,False,0.0,gemini-2.5-pro,make-mips-interpreter,1813.991046,False,0.0,False,1813.991046 +b9ec74d3-3538-4eed-925e-c746b037b41b,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,torch-tensor-parallelism,2595,1921,4516,264.292741,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,torch-tensor-parallelism,264.292741,False,0.0,False,264.292741 +270fff03-dd54-4da2-8a11-0404be30a5ab,claude-opus-4-1-20250805,anthropic,dna-assembly,15419,9568,24987,728.300629,False,0.0,claude-opus-4-1-20250805,dna-assembly,728.300629,False,0.0,False,728.300629 
+2a44b8e0-c44d-4d28-91f6-f48ded348133,zai-org/GLM-4.5-Air-FP8,together_ai,fix-code-vulnerability,20474,10769,31243,503.604219,False,0.0,zai-org/GLM-4.5-Air-FP8,fix-code-vulnerability,503.604219,False,0.0,False,503.604219 +151073a2-a54b-4f6e-8442-b7fbf8ed6d8b,OpenAI/gpt-oss-20B,together_ai,adaptive-rejection-sampler,214,2766,2980,133.689527,False,0.0,OpenAI/gpt-oss-20B,adaptive-rejection-sampler,133.689527,False,0.0,False,133.689527 +393aecfc-6744-4752-9862-b9ee75b6321d,gpt-5-mini,openai,sqlite-with-gcov,1985,1111,3096,244.830021,True,1.0,gpt-5-mini,sqlite-with-gcov,244.830021,True,1.0,True,244.830021 +cf8fc772-27ef-46c5-a0ef-c98b3aa84484,grok-code-fast-1,xai,feal-differential-cryptanalysis,2515,1765,4280,165.958678,False,0.0,grok-code-fast-1,feal-differential-cryptanalysis,165.958678,False,0.0,False,165.958678 +0eeefc2e-c78d-4a36-b887-ca0fc0f0e4f9,gpt-5-mini,openai,torch-tensor-parallelism,3383,2237,5620,93.839999,False,0.0,gpt-5-mini,torch-tensor-parallelism,93.839999,False,0.0,False,93.839999 +365a54ec-e6b1-4c0d-811b-bdc50aabc9da,gemini-2.5-pro,gemini,db-wal-recovery,10812,5247,16059,906.509691,False,0.0,gemini-2.5-pro,db-wal-recovery,906.509691,False,0.0,False,906.509691 +880f477a-f11e-4e47-abda-9aecf2538b26,gemini-2.5-pro,gemini,openssl-selfsigned-cert,2658,1971,4629,187.011159,True,1.0,gemini-2.5-pro,openssl-selfsigned-cert,187.011159,True,0.6,True,187.011159 +c29606d9-d129-4004-8c1c-fed9af885f20,gemini-2.5-pro,gemini,bn-fit-modify,26052,15995,42047,2057.063295,False,0.0,gemini-2.5-pro,bn-fit-modify,2057.063295,False,0.0,False,2057.063295 +a39acfd1-92df-4f23-be2b-f8d34b95e99d,zai-org/GLM-4.5-Air-FP8,together_ai,polyglot-c-py,1880,2358,4238,58.540728,False,0.0,zai-org/GLM-4.5-Air-FP8,polyglot-c-py,58.540728,False,0.0,False,58.540728 +db491ae0-036a-49f5-bb19-7c77938c054f,gpt-5-nano,openai,chess-best-move,20438,11223,31661,900.808594,False,0.0,gpt-5-nano,chess-best-move,900.808594,False,0.0,False,900.808594 
+420bd9ae-c0b3-4f5d-9d4c-a2eb37dedc52,gemini-2.5-flash,gemini,torch-tensor-parallelism,1899,1148,3047,106.718819,False,0.0,gemini-2.5-flash,torch-tensor-parallelism,106.718819,False,0.0,False,106.718819 +595e69cb-bf16-42f2-ba4c-b9a66299fcec,gpt-5-mini,openai,extract-elf,1821,1186,3007,227.823148,False,0.0,gpt-5-mini,extract-elf,227.823148,False,0.6,False,227.823148 +f17520ad-0263-46b5-b001-99fd9003db9c,claude-sonnet-4-20250514,anthropic,cancel-async-tasks,2647,2094,4741,214.053384,True,1.0,claude-sonnet-4-20250514,cancel-async-tasks,214.053384,True,0.8,True,214.053384 +df04802d-c892-4a9c-bceb-4987130145fd,gpt-5,openai,wasm-pipeline,7964,7908,15872,697.914905,True,1.0,gpt-5,wasm-pipeline,697.914905,True,1.0,True,697.914905 +be43eefc-bb79-400a-800b-f91bac6bacdf,gpt-5-nano,openai,sqlite-with-gcov,11701,4408,16109,430.979574,True,1.0,gpt-5-nano,sqlite-with-gcov,430.979574,True,0.6,True,430.979574 +b59f150b-8b59-4d24-98f5-6d999fb75cab,gpt-5-mini,openai,chess-best-move,15452,6666,22118,904.543426,False,0.0,gpt-5-mini,chess-best-move,904.543426,False,0.0,False,904.543426 +aef94f94-62d5-4af6-b099-ee82ba5e0c03,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,path-tracing,1980,1399,3379,90.968048,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,path-tracing,90.968048,False,0.0,False,90.968048 +73b85c2f-0203-4d56-a4a0-5da30bdad1fe,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,adaptive-rejection-sampler,11308,7721,19029,916.269919,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,adaptive-rejection-sampler,916.269919,False,0.0,False,916.269919 +7bb4f3b9-9ed2-4419-9f81-964eb277c6af,gemini-2.5-pro,gemini,build-pmars,12438,4550,16988,425.277691,True,1.0,gemini-2.5-pro,build-pmars,425.277691,True,1.0,True,425.277691 +e7f6165f-9db7-434c-ac63-ee63fba32ab9,gpt-5-mini,openai,install-windows-3.11,4626,2469,7095,266.145285,False,0.0,gpt-5-mini,install-windows-3.11,266.145285,False,0.0,False,266.145285 
+1e21f7c9-b966-4bd0-b874-3775bddaf2b1,gpt-5,openai,make-doom-for-mips,7783,8348,16131,900.002286,False,0.0,gpt-5,make-doom-for-mips,900.002286,False,0.0,False,900.002286 +4284deef-8436-4a92-9185-205bf3cacbde,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,git-leak-recovery,2433,1775,4208,116.743747,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,git-leak-recovery,116.743747,True,1.0,True,116.743747 +3300c18c-ecca-4ad4-9967-1669897be8ee,gpt-5-nano,openai,break-filter-js-from-html,8289,10885,19174,1254.933754,False,0.0,gpt-5-nano,break-filter-js-from-html,1254.933754,False,0.0,False,1254.933754 +b776f559-18fb-4c91-ab52-06d2231e58dc,zai-org/GLM-4.5-Air-FP8,together_ai,schemelike-metacircular-eval,24783,24953,49736,905.561927,False,0.0,zai-org/GLM-4.5-Air-FP8,schemelike-metacircular-eval,905.561927,False,0.0,False,905.561927 +a108b9a0-292e-4e37-8760-48a66deff06d,gpt-5,openai,make-doom-for-mips,7889,4122,12011,906.463231,False,0.0,gpt-5,make-doom-for-mips,906.463231,False,0.0,False,906.463231 +8b18dedb-1aec-4eb7-88ad-b1eb1c9cc167,deepseek-ai/DeepSeek-V3.1,together_ai,reverse-engineering,31670,15940,47610,1805.682187,False,0.0,deepseek-ai/DeepSeek-V3.1,reverse-engineering,1805.682187,False,0.2,False,1805.682187 +958ed9ca-4650-43b3-8ba0-f86f0f4c20ec,claude-sonnet-4-20250514,anthropic,largest-eigenval,3817,2867,6684,906.091434,False,0.0,claude-sonnet-4-20250514,largest-eigenval,906.091434,False,0.0,False,906.091434 +eb508604-8ad6-438c-98fc-e5fcbb9f99c5,gpt-5-mini,openai,build-pmars,15843,5162,21005,604.95726,True,1.0,gpt-5-mini,build-pmars,604.95726,True,0.2,True,604.95726 +30e53f46-c864-4daa-9f4f-f53179e3b3a8,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,video-processing,3051,2397,5448,347.069534,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,video-processing,347.069534,False,0.0,False,347.069534 
+0f6a60dd-f49e-42e8-9efc-001126ec6763,deepseek-ai/DeepSeek-V3.1,together_ai,mteb-leaderboard,1772,1526,3298,150.642923,False,0.0,deepseek-ai/DeepSeek-V3.1,mteb-leaderboard,150.642923,False,0.0,False,150.642923 +c2ccdb5e-8a42-4a1a-9708-4511877bc04b,grok-code-fast-1,xai,financial-document-processor,6903,1919,8822,295.970427,False,0.0,grok-code-fast-1,financial-document-processor,295.970427,False,0.0,False,295.970427 +31b3becc-2ea4-4486-9d57-7441e852c7e0,grok-4-0709,xai,chess-best-move,9364,1772,11136,911.377773,False,0.0,grok-4-0709,chess-best-move,911.377773,False,0.0,False,911.377773 +f18235ff-1fd3-4b74-af46-28fe7cffa977,claude-sonnet-4-20250514,anthropic,chess-best-move,11539,7712,19251,747.189363,False,0.0,claude-sonnet-4-20250514,chess-best-move,747.189363,False,0.0,False,747.189363 +835a0073-3d85-44db-87d2-4f72b5ff4bfe,gpt-5-nano,openai,build-cython-ext,6117,2293,8410,919.813052,False,0.0,gpt-5-nano,build-cython-ext,919.813052,False,0.0,False,919.813052 +e34312a2-c0e0-4b20-aa22-52fe9ca8bc63,zai-org/GLM-4.5-Air-FP8,together_ai,largest-eigenval,16121,15660,31781,900.005405,False,0.0,zai-org/GLM-4.5-Air-FP8,largest-eigenval,900.005405,False,0.0,False,900.005405 +5812557d-5e3b-4f9b-9375-105da96b6e64,gpt-5-mini,openai,filter-js-from-html,2032,2553,4585,231.185136,False,0.0,gpt-5-mini,filter-js-from-html,231.185136,False,0.0,False,231.185136 +7e4071e9-b597-48a8-bab7-d761c0744c30,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,fix-code-vulnerability,5512,1485,6997,1062.355889,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,fix-code-vulnerability,1062.355889,False,0.0,False,1062.355889 +6a1aa59a-44c7-4f6c-9cad-4cdcf271d4df,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,vulnerable-secret,3019,2255,5274,302.983967,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,vulnerable-secret,302.983967,False,0.0,False,302.983967 
+aa86d76f-f732-4af2-b931-56fa8c29cbff,moonshotai/Kimi-K2-Instruct-0905,together_ai,tune-mjcf,6716,6650,13366,935.342423,False,0.0,moonshotai/Kimi-K2-Instruct-0905,tune-mjcf,935.342423,False,0.4,False,935.342423 +a16185be-39fb-4cd9-8ec8-a7c0a2697e3a,deepseek-ai/DeepSeek-V3.1,together_ai,polyglot-c-py,37732,23657,61389,919.667277,False,0.0,deepseek-ai/DeepSeek-V3.1,polyglot-c-py,919.667277,False,0.0,False,919.667277 +b12512ca-5ec4-4f1c-849a-16e15eee4ee2,gemini-2.5-flash,gemini,crack-7z-hash,8302,6271,14573,605.059823,False,0.0,gemini-2.5-flash,crack-7z-hash,605.059823,False,0.8,False,605.059823 +36ea7088-bfc1-47d5-bb8c-3ee8b1a24501,claude-opus-4-1-20250805,anthropic,fix-git,2809,1825,4634,69.302587,True,1.0,claude-opus-4-1-20250805,fix-git,69.302587,True,1.0,True,69.302587 +65b3bfb9-c51d-47e5-beff-20be74796049,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,crack-7z-hash,2932,1362,4294,109.678749,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,crack-7z-hash,109.678749,False,0.0,False,109.678749 +2dd96148-0cb9-443c-9ec0-98f42ab69b82,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,large-scale-text-editing,6403,6337,12740,708.316535,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,large-scale-text-editing,708.316535,False,0.0,False,708.316535 +c4357ef5-fce0-4ac9-b1e7-6475f44322eb,grok-4-0709,xai,train-fasttext,21722,11103,32825,3646.909724,False,0.0,grok-4-0709,train-fasttext,3646.909724,False,0.2,False,3646.909724 +3b091743-9d58-4880-a98a-afdf2fd0a4ed,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,qemu-alpine-ssh,3510,4426,7936,904.12361,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,qemu-alpine-ssh,904.12361,False,0.2,False,904.12361 +299add31-1e46-41ad-92d8-8ca2a9e27ea2,zai-org/GLM-4.5-Air-FP8,together_ai,pytorch-model-cli,18416,6797,25213,435.326062,False,0.0,zai-org/GLM-4.5-Air-FP8,pytorch-model-cli,435.326062,False,0.0,False,435.326062 
+0295b1eb-f9b3-473f-b936-a8bf02c59d81,gemini-2.5-pro,gemini,fix-git,4824,1562,6386,143.803245,True,1.0,gemini-2.5-pro,fix-git,143.803245,True,1.0,True,143.803245 +3678bd85-6fd1-44a1-a741-2bd13d1bfd43,moonshotai/Kimi-K2-Instruct-0905,together_ai,adaptive-rejection-sampler,14367,7147,21514,900.33538,False,0.0,moonshotai/Kimi-K2-Instruct-0905,adaptive-rejection-sampler,900.33538,False,0.0,False,900.33538 +2d534205-5b7c-49a3-82c4-4d22f8373a39,gemini-2.5-pro,gemini,wasm-pipeline,10591,3726,14317,415.427435,False,0.0,gemini-2.5-pro,wasm-pipeline,415.427435,False,0.0,False,415.427435 +118d8122-b389-4dae-ab44-9c4ac8e97334,claude-opus-4-1-20250805,anthropic,large-scale-text-editing,5025,4026,9051,816.861871,True,1.0,claude-opus-4-1-20250805,large-scale-text-editing,816.861871,True,0.6666666666666666,True,816.861871 +a771d2b7-bd6c-4254-a1ea-cad7f7725e5e,gpt-5,openai,schemelike-metacircular-eval,8994,36938,45932,2400.99404,False,0.0,gpt-5,schemelike-metacircular-eval,2400.99404,False,0.0,False,2400.99404 +e7beaccf-489a-4aab-b96f-2bc53f170894,gemini-2.5-pro,gemini,fix-code-vulnerability,8912,5442,14354,790.776486,False,0.0,gemini-2.5-pro,fix-code-vulnerability,790.776486,False,0.2,False,790.776486 +71fef181-990a-4f97-94b4-1c39ea66e95c,gpt-5-mini,openai,cancel-async-tasks,1852,1364,3216,119.079362,True,1.0,gpt-5-mini,cancel-async-tasks,119.079362,True,0.4,True,119.079362 +fd71404b-c7e4-478f-9e7c-b27d47186994,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,polyglot-c-py,3065,2150,5215,78.489297,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,polyglot-c-py,78.489297,False,0.0,False,78.489297 +ee7c1a0e-5cf3-48da-a381-fdff2d3f3d77,zai-org/GLM-4.5-Air-FP8,together_ai,git-leak-recovery,2667,3181,5848,369.341489,True,1.0,zai-org/GLM-4.5-Air-FP8,git-leak-recovery,369.341489,True,0.8,True,369.341489 
+fc4cfd33-df42-4460-916c-27d847a43da8,grok-4-0709,xai,run-pdp11-code,3544,3354,6898,1023.539085,False,0.0,grok-4-0709,run-pdp11-code,1023.539085,False,0.0,False,1023.539085 +9bd387da-9efa-4fd7-a3e7-28af561bc6a5,gpt-5-mini,openai,nginx-request-logging,3813,1725,5538,335.965284,False,0.0,gpt-5-mini,nginx-request-logging,335.965284,False,0.4,False,335.965284 +68db99b7-51c6-4ea6-a594-d3044733dc58,grok-4-0709,xai,install-windows-3.11,6422,2371,8793,512.911126,False,0.0,grok-4-0709,install-windows-3.11,512.911126,False,0.0,False,512.911126 +46b54077-f5eb-4df0-9539-85367512ebe8,zai-org/GLM-4.5-Air-FP8,together_ai,sqlite-with-gcov,9740,2128,11868,198.423864,True,1.0,zai-org/GLM-4.5-Air-FP8,sqlite-with-gcov,198.423864,True,0.6,True,198.423864 +193e57c9-2515-419b-ba43-c099fa13b2be,deepseek-ai/DeepSeek-V3.1,together_ai,build-pov-ray,26208,12415,38623,2338.508084,True,1.0,deepseek-ai/DeepSeek-V3.1,build-pov-ray,2338.508084,True,0.4,True,2338.508084 +1565a4e7-7ff6-4d47-abe5-8e095aef4f2a,gemini-2.5-pro,gemini,pypi-server,6193,3265,9458,825.17696,True,1.0,gemini-2.5-pro,pypi-server,825.17696,True,0.8,True,825.17696 +d8b301eb-5d59-425d-a649-589ae869175b,gemini-2.5-pro,gemini,train-fasttext,23757,6928,30685,3601.985707,False,0.0,gemini-2.5-pro,train-fasttext,3601.985707,False,0.0,False,3601.985707 +d66b8d7e-a5be-4a25-8167-317f2024d192,grok-code-fast-1,xai,merge-diff-arc-agi-task,12066,5469,17535,910.407648,False,0.0,grok-code-fast-1,merge-diff-arc-agi-task,910.407648,False,0.8,False,910.407648 +1fd89e02-aeb6-4c55-b52c-159ec614e3ef,gpt-5,openai,nginx-request-logging,5031,2637,7668,504.06337,True,1.0,gpt-5,nginx-request-logging,504.06337,True,1.0,True,504.06337 +65618365-9d10-4eb3-b9c1-31053a1273fb,gpt-5-mini,openai,dna-insert,962,3322,4284,453.338066,False,0.0,gpt-5-mini,dna-insert,453.338066,False,0.0,False,453.338066 
+77d98bf1-2fd1-4540-9bd6-80e189de6cee,gpt-5-mini,openai,cobol-modernization,5035,2807,7842,665.606813,True,1.0,gpt-5-mini,cobol-modernization,665.606813,True,1.0,True,665.606813 +7587ebcd-3cab-45c3-88b5-5b5000c5266b,gemini-2.5-pro,gemini,filter-js-from-html,2294,1612,3906,172.377752,False,0.0,gemini-2.5-pro,filter-js-from-html,172.377752,False,0.0,False,172.377752 +62d25046-bf12-4cb2-ac5a-c60d60d648a0,moonshotai/Kimi-K2-Instruct-0905,together_ai,wasm-pipeline,17381,7043,24424,916.817123,False,0.0,moonshotai/Kimi-K2-Instruct-0905,wasm-pipeline,916.817123,False,0.2,False,916.817123 +ecc90827-bd06-4590-b9b0-7be15348cbac,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,prove-plus-comm,1489,2031,3520,393.231077,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,prove-plus-comm,393.231077,False,0.0,False,393.231077 +b1100d68-0e07-496b-9cdb-615c581a86e5,grok-code-fast-1,xai,port-compressor,19342,21910,41252,1578.648033,False,0.0,grok-code-fast-1,port-compressor,1578.648033,False,0.0,False,1578.648033 +6a72c6a3-67b4-4a41-b12b-64d2d42f9ec0,claude-sonnet-4-20250514,anthropic,qemu-alpine-ssh,2736,4263,6999,600.721124,True,1.0,claude-sonnet-4-20250514,qemu-alpine-ssh,600.721124,True,0.6,True,600.721124 +77f7aeb1-5d27-4100-9012-cb2286ed7180,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,schemelike-metacircular-eval,2832,2655,5487,212.851608,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,schemelike-metacircular-eval,212.851608,False,0.0,False,212.851608 +43bda7f4-0edd-4200-aa9c-267cf18fe3c1,openai/gpt-oss-120b,together_ai,schemelike-metacircular-eval,7608,3389,10997,225.855565,False,0.0,openai/gpt-oss-120b,schemelike-metacircular-eval,225.855565,False,0.0,False,225.855565 +b5ad66fd-7890-4df2-ba41-bb9fdef2f075,openai/gpt-oss-120b,together_ai,filter-js-from-html,2424,1856,4280,173.466687,False,0.0,openai/gpt-oss-120b,filter-js-from-html,173.466687,False,0.0,False,173.466687 
+391e5177-45a2-4255-92a7-0b602b13533a,claude-opus-4-1-20250805,anthropic,port-compressor,52673,36467,89140,3633.895463,False,0.0,claude-opus-4-1-20250805,port-compressor,3633.895463,False,0.0,False,3633.895463 +5e54f47e-bc87-4b9b-850d-83ff8aeb9e35,gpt-5-nano,openai,video-processing,3481,2872,6353,138.784426,False,0.0,gpt-5-nano,video-processing,138.784426,False,0.0,False,138.784426 +c7a18052-035d-419f-83df-cee2a0f02b56,openai/gpt-oss-120b,together_ai,cancel-async-tasks,1237,539,1776,80.955706,False,0.0,openai/gpt-oss-120b,cancel-async-tasks,80.955706,False,0.6,False,80.955706 +a8df12f3-9ecf-49c4-88ca-91d63b4851db,zai-org/GLM-4.5-Air-FP8,together_ai,distribution-search,844,3164,4008,263.069871,False,0.0,zai-org/GLM-4.5-Air-FP8,distribution-search,263.069871,False,0.0,False,263.069871 +f599bdca-c5f5-49a6-95c1-14a4a6ecbc66,claude-sonnet-4-20250514,anthropic,circuit-fibsqrt,22839,23267,46106,3129.493289,False,0.0,claude-sonnet-4-20250514,circuit-fibsqrt,3129.493289,False,0.0,False,3129.493289 +f8b929db-54db-4269-9509-fc13931d24de,gpt-5,openai,pytorch-model-recovery,9591,9294,18885,910.361005,False,0.0,gpt-5,pytorch-model-recovery,910.361005,False,0.4285714285714285,False,910.361005 +15ff763f-29f4-4ca5-ae72-b82a10cdf2dd,gpt-5-mini,openai,gpt2-codegolf,2098,1843,3941,119.737154,False,0.0,gpt-5-mini,gpt2-codegolf,119.737154,False,0.0,False,119.737154 +21eb4d38-b16d-403b-a017-0fd6fdd0555d,grok-4-0709,xai,dna-assembly,1155,336,1491,774.724666,False,0.0,grok-4-0709,dna-assembly,774.724666,False,0.0,False,774.724666 +12363f43-2d10-4ca4-81d1-9f8d53753b93,gemini-2.5-pro,gemini,password-recovery,1935,1473,3408,1590.976104,False,0.0,gemini-2.5-pro,password-recovery,1590.976104,False,0.0,False,1590.976104 +6d479389-503c-43d7-ac63-bc7b14ccff34,gpt-5-mini,openai,pypi-server,2962,1167,4129,145.250695,True,1.0,gpt-5-mini,pypi-server,145.250695,True,0.8,True,145.250695 
+5033897a-554e-4b19-95b1-d604d04c8dc7,openai/gpt-oss-120b,together_ai,wasm-pipeline,2675,2361,5036,225.762332,False,0.0,openai/gpt-oss-120b,wasm-pipeline,225.762332,False,0.0,False,225.762332 +cebc8fed-ce0f-4dd8-aaa9-7f920a8da2b9,gemini-2.5-pro,gemini,adaptive-rejection-sampler,12513,13111,25624,906.747334,True,1.0,gemini-2.5-pro,adaptive-rejection-sampler,906.747334,True,0.4,True,906.747334 +c48b4a1f-c678-4ffd-9789-0f90e13c8252,gpt-5-mini,openai,mteb-retrieve,4688,3091,7779,369.050504,False,0.0,gpt-5-mini,mteb-retrieve,369.050504,False,0.0,False,369.050504 +a8fbac2b-d36d-4234-bb76-195f2a2d49e4,moonshotai/Kimi-K2-Instruct-0905,together_ai,path-tracing-reverse,12494,12392,24886,1264.466779,False,0.0,moonshotai/Kimi-K2-Instruct-0905,path-tracing-reverse,1264.466779,False,0.0,False,1264.466779 +4035013f-411a-4e6d-819c-523e0766d3ae,openai/gpt-oss-120b,together_ai,regex-log,1238,824,2062,48.991195,True,1.0,openai/gpt-oss-120b,regex-log,48.991195,True,0.4,True,48.991195 +eca6dbc7-7f19-4ecc-9c63-c9d8cf7cf3fa,grok-4-0709,xai,mteb-leaderboard,932,456,1388,189.639165,False,0.0,grok-4-0709,mteb-leaderboard,189.639165,False,0.0,False,189.639165 +923ef369-abbd-4591-bfdd-31cd10a0af1d,claude-opus-4-1-20250805,anthropic,wasm-pipeline,11904,3144,15048,355.818902,False,0.0,claude-opus-4-1-20250805,wasm-pipeline,355.818902,False,0.1428571428571428,False,355.818902 +3c3d3ffa-5e36-48c5-bfaf-7f9e311e7db0,gemini-2.5-flash,gemini,build-pmars,9172,4318,13490,533.871312,True,1.0,gemini-2.5-flash,build-pmars,533.871312,True,0.8,True,533.871312 +777bf74f-c7e0-4a8d-8dc2-98ab0a5eb4e2,moonshotai/Kimi-K2-Instruct-0905,together_ai,sparql-university,8331,4909,13240,387.139545,False,0.0,moonshotai/Kimi-K2-Instruct-0905,sparql-university,387.139545,False,0.0,False,387.139545 
+f317dcb5-71ec-4ebb-b064-d37bf0ade247,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,configure-git-webserver,7761,2729,10490,900.290625,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,configure-git-webserver,900.290625,False,0.6,False,900.290625 +89986160-f9b2-46e5-886f-ce21d6fafc20,claude-opus-4-1-20250805,anthropic,run-pdp11-code,9362,5091,14453,414.240595,False,0.0,claude-opus-4-1-20250805,run-pdp11-code,414.240595,False,0.0,False,414.240595 +9eb795ae-0bc8-4eba-8d97-ce40189a1b00,claude-opus-4-1-20250805,anthropic,sqlite-db-truncate,7362,4331,11693,282.38081,False,0.0,claude-opus-4-1-20250805,sqlite-db-truncate,282.38081,False,0.125,False,282.38081 +5b464a34-6c95-410f-bc96-f8724038d091,gemini-2.5-flash,gemini,video-processing,3514,2998,6512,227.169432,False,0.0,gemini-2.5-flash,video-processing,227.169432,False,0.0,False,227.169432 +74226433-2b61-499f-9c66-61467bf2b2a1,gpt-5,openai,distribution-search,2893,1895,4788,255.047714,True,1.0,gpt-5,distribution-search,255.047714,True,1.0,True,255.047714 +e437a042-2d76-45b7-aa18-78aa7c1a09cc,deepseek-ai/DeepSeek-V3.1,together_ai,train-fasttext,31019,9506,40525,3600.03086,False,0.0,deepseek-ai/DeepSeek-V3.1,train-fasttext,3600.03086,False,0.0,False,3600.03086 +7ae47306-bb3e-4241-99b7-6f18db50f9ba,gpt-5-nano,openai,make-mips-interpreter,21233,18046,39279,1806.515231,False,0.0,gpt-5-nano,make-mips-interpreter,1806.515231,False,0.0,False,1806.515231 +148480b3-7dce-400e-8a8c-7f65956c58f3,zai-org/GLM-4.5-Air-FP8,together_ai,constraints-scheduling,5129,4665,9794,516.868172,True,1.0,zai-org/GLM-4.5-Air-FP8,constraints-scheduling,516.868172,True,0.8,True,516.868172 +68797e4d-8a6a-4d44-a779-a4ae5dc9e94c,gpt-5,openai,log-summary-date-ranges,5438,1409,6847,111.243658,False,0.0,gpt-5,log-summary-date-ranges,111.243658,False,0.0,False,111.243658 
+6be48d70-e23f-4453-a59f-1bd47017efef,claude-opus-4-1-20250805,anthropic,qemu-alpine-ssh,3794,4746,8540,452.760669,True,1.0,claude-opus-4-1-20250805,qemu-alpine-ssh,452.760669,True,0.8571428571428571,True,452.760669 +58a2576f-8aa4-4715-b8cd-4d83f86390aa,grok-code-fast-1,xai,model-extraction-relu-logits,1466,880,2346,86.930158,False,0.0,grok-code-fast-1,model-extraction-relu-logits,86.930158,False,0.0,False,86.930158 +e635faf0-4425-491c-bb67-c68b6c4e2a3f,gpt-5-nano,openai,qemu-alpine-ssh,2783,3750,6533,900.117622,False,0.0,gpt-5-nano,qemu-alpine-ssh,900.117622,False,0.0,False,900.117622 +804f2b10-35f8-4b12-b73f-8efbb05db0be,grok-code-fast-1,xai,sparql-university,1478,777,2255,415.611983,False,0.0,grok-code-fast-1,sparql-university,415.611983,False,0.2,False,415.611983 +32cfe257-a021-422c-9268-133e1757e04c,gemini-2.5-flash,gemini,install-windows-3.11,2393,2714,5107,328.857361,False,0.0,gemini-2.5-flash,install-windows-3.11,328.857361,False,0.0,False,328.857361 +48139ece-b8f9-43c0-b830-ff8cd34ac5ab,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,extract-elf,4852,2890,7742,297.559173,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,extract-elf,297.559173,False,0.0,False,297.559173 +6271fe85-9d43-47f4-a2ac-f997485d4127,grok-4-0709,xai,distribution-search,2434,1934,4368,624.848846,True,1.0,grok-4-0709,distribution-search,624.848846,True,0.4,True,624.848846 +e8bf67b0-cf20-4ea3-9fe3-c133bb80eb11,gpt-5-mini,openai,sqlite-with-gcov,1662,1256,2918,509.833187,True,1.0,gpt-5-mini,sqlite-with-gcov,509.833187,True,1.0,True,509.833187 +f0867060-a089-4411-b006-491b8f2c45c0,gpt-5-mini,openai,torch-tensor-parallelism,2824,2662,5486,86.937252,False,0.0,gpt-5-mini,torch-tensor-parallelism,86.937252,False,0.0,False,86.937252 +6664bb92-73d1-4c85-9296-9136052280df,grok-code-fast-1,xai,sanitize-git-repo,5153,1459,6612,233.533343,False,0.0,grok-code-fast-1,sanitize-git-repo,233.533343,False,0.0,False,233.533343 
+3cd9e1da-2db1-4267-b425-db8c50092902,gemini-2.5-pro,gemini,fix-ocaml-gc,25512,12438,37950,3600.095149,False,0.0,gemini-2.5-pro,fix-ocaml-gc,3600.095149,False,0.2,False,3600.095149 +28693443-691e-4ad7-b412-d92790eb616a,gpt-5-mini,openai,code-from-image,16418,17864,34282,1219.535198,False,0.0,gpt-5-mini,code-from-image,1219.535198,False,0.0,False,1219.535198 +0d8e6526-542a-4c3f-937a-3643c7b2826a,grok-code-fast-1,xai,vulnerable-secret,9189,4952,14141,287.634477,True,1.0,grok-code-fast-1,vulnerable-secret,287.634477,True,0.6,True,287.634477 +8aec5210-c091-43e9-b017-443c52659ff9,gpt-5-nano,openai,path-tracing,30641,29926,60567,1810.486239,False,0.0,gpt-5-nano,path-tracing,1810.486239,False,0.2,False,1810.486239 +bbffa713-9fbc-4c3a-9946-f8a63fc3d494,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,fix-ocaml-gc,32997,11108,44105,3627.825435,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,fix-ocaml-gc,3627.825435,False,0.0,False,3627.825435 +31903b1d-b565-410f-84b7-9818a9277888,claude-sonnet-4-20250514,anthropic,torch-tensor-parallelism,5938,4809,10747,155.309924,False,0.0,claude-sonnet-4-20250514,torch-tensor-parallelism,155.309924,False,0.0,False,155.309924 +40488afa-6691-4eb4-927f-fbfbf1cc9b9d,claude-sonnet-4-20250514,anthropic,reshard-c4-data,7779,7748,15527,900.401121,False,0.0,claude-sonnet-4-20250514,reshard-c4-data,900.401121,False,0.0,False,900.401121 +f14077fe-ccb2-4a70-b35f-a01dbd819a7a,moonshotai/Kimi-K2-Instruct-0905,together_ai,circuit-fibsqrt,33797,49876,83673,3624.453492,False,0.0,moonshotai/Kimi-K2-Instruct-0905,circuit-fibsqrt,3624.453492,False,0.0,False,3624.453492 +dbafe363-3c24-4999-93cb-a804603d4e3b,grok-4-0709,xai,regex-log,1774,1624,3398,583.490481,True,1.0,grok-4-0709,regex-log,583.490481,True,0.6,True,583.490481 
+4befc5da-a436-472a-abb8-ad979455e306,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,port-compressor,74227,49249,123476,3600.001221,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,port-compressor,3600.001221,False,0.0,False,3600.001221 +ee4465a5-b328-43ba-bbb5-d91594eb5a21,grok-code-fast-1,xai,torch-tensor-parallelism,2156,1436,3592,49.039392,False,0.0,grok-code-fast-1,torch-tensor-parallelism,49.039392,False,0.0,False,49.039392 +8027bb23-315d-40b5-99c0-4a04fbd15e2b,gemini-2.5-pro,gemini,break-filter-js-from-html,4241,4105,8346,1203.268636,False,0.0,gemini-2.5-pro,break-filter-js-from-html,1203.268636,False,0.2,False,1203.268636 +06212dbc-e651-40e9-b820-52531b9c06a2,OpenAI/gpt-oss-20B,together_ai,bn-fit-modify,1351,4315,5666,79.49707,False,0.0,OpenAI/gpt-oss-20B,bn-fit-modify,79.49707,False,0.0,False,79.49707 +36df6a28-2cf1-4861-aa2f-08ce10a5e1d7,claude-opus-4-1-20250805,anthropic,prove-plus-comm,2087,1717,3804,159.007377,True,1.0,claude-opus-4-1-20250805,prove-plus-comm,159.007377,True,1.0,True,159.007377 +f5d40646-39de-420c-86f3-af650d44e9fd,openai/gpt-oss-120b,together_ai,sanitize-git-repo,5491,3089,8580,145.117085,False,0.0,openai/gpt-oss-120b,sanitize-git-repo,145.117085,False,0.0,False,145.117085 +11446b26-35c5-4cc9-a4ae-eec840dd62ce,zai-org/GLM-4.5-Air-FP8,together_ai,filter-js-from-html,520,1434,1954,128.306812,False,0.0,zai-org/GLM-4.5-Air-FP8,filter-js-from-html,128.306812,False,0.0,False,128.306812 +4607115f-432f-4e0e-bece-d5d02e19497b,gpt-5-mini,openai,qemu-alpine-ssh,786,1496,2282,982.850539,False,0.0,gpt-5-mini,qemu-alpine-ssh,982.850539,False,0.0,False,982.850539 +8af0a91e-0c19-4366-86bb-128e0b8970f5,deepseek-ai/DeepSeek-V3.1,together_ai,db-wal-recovery,3899,4165,8064,917.66822,False,0.0,deepseek-ai/DeepSeek-V3.1,db-wal-recovery,917.66822,False,0.0,False,917.66822 
+b0a394fe-201b-46a1-88b6-574265e54ecf,claude-opus-4-1-20250805,anthropic,train-fasttext,16917,5281,22198,4868.621336,False,0.0,claude-opus-4-1-20250805,train-fasttext,4868.621336,False,0.2857142857142857,False,4868.621336 +44b5a656-d655-4031-8d57-c5e7afb47324,gpt-5,openai,large-scale-text-editing,6122,3747,9869,908.91406,False,0.0,gpt-5,large-scale-text-editing,908.91406,False,0.4285714285714285,False,908.91406 +6f0f7620-6e0f-40a2-8f47-e16b1ebb3a1d,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,break-filter-js-from-html,10891,11440,22331,1156.883808,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,break-filter-js-from-html,1156.883808,False,0.0,False,1156.883808 +9b67c678-9b71-4b5b-aa21-c6deef3ade25,zai-org/GLM-4.5-Air-FP8,together_ai,model-extraction-relu-logits,1727,1782,3509,191.329676,False,0.0,zai-org/GLM-4.5-Air-FP8,model-extraction-relu-logits,191.329676,False,0.2,False,191.329676 +11f82b89-1f7f-49b5-88d5-728824e335eb,OpenAI/gpt-oss-20B,together_ai,circuit-fibsqrt,186,502,688,103.985823,False,0.0,OpenAI/gpt-oss-20B,circuit-fibsqrt,103.985823,False,0.0,False,103.985823 +375481d8-a9a3-4aaf-b391-db02f50a686e,claude-opus-4-1-20250805,anthropic,wasm-pipeline,11126,2851,13977,774.733994,False,0.0,claude-opus-4-1-20250805,wasm-pipeline,774.733994,False,0.1428571428571428,False,774.733994 +9d5649f7-075e-4a87-b075-5d7ced8de2b0,grok-4-0709,xai,sanitize-git-repo,7597,1586,9183,340.71191,False,0.0,grok-4-0709,sanitize-git-repo,340.71191,False,0.0,False,340.71191 +939960f1-6c39-4330-9dd4-9a1918291666,claude-sonnet-4-20250514,anthropic,write-compressor,7407,8378,15785,900.03297,False,0.0,claude-sonnet-4-20250514,write-compressor,900.03297,False,0.0,False,900.03297 +bdd8a5cd-0329-4b93-b729-cc2be43efd06,moonshotai/Kimi-K2-Instruct-0905,together_ai,bn-fit-modify,26629,13417,40046,927.795137,False,0.0,moonshotai/Kimi-K2-Instruct-0905,bn-fit-modify,927.795137,False,0.0,False,927.795137 
+e8ab8e51-c1b7-4b15-84fd-0496f67529e2,OpenAI/gpt-oss-20B,together_ai,model-extraction-relu-logits,75,438,513,1421.58791,False,0.0,OpenAI/gpt-oss-20B,model-extraction-relu-logits,1421.58791,False,0.0,False,1421.58791 +75b38d80-0150-418a-874c-66d755627a38,gpt-5-mini,openai,port-compressor,31310,32850,64160,3605.167486,False,0.0,gpt-5-mini,port-compressor,3605.167486,False,0.0,False,3605.167486 +803c1e68-4163-4e0b-97e2-5ef7f7023c76,gemini-2.5-flash,gemini,fix-ocaml-gc,63513,58244,121757,3600.001254,False,0.0,gemini-2.5-flash,fix-ocaml-gc,3600.001254,False,0.0,False,3600.001254 +61675f35-6b20-4de5-ac87-ff924acc7bdf,moonshotai/Kimi-K2-Instruct-0905,together_ai,gpt2-codegolf,10514,11489,22003,900.028442,False,0.0,moonshotai/Kimi-K2-Instruct-0905,gpt2-codegolf,900.028442,False,0.0,False,900.028442 +b5f2ac72-f0bf-4b5a-88e2-9466b5bf0c68,claude-opus-4-1-20250805,anthropic,build-pov-ray,16625,6974,23599,637.10085,False,0.0,claude-opus-4-1-20250805,build-pov-ray,637.10085,False,0.75,False,637.10085 +2317eb39-2e5d-4794-8b57-c4a87b9f7051,grok-4-0709,xai,password-recovery,5399,1446,6845,907.419619,False,0.0,grok-4-0709,password-recovery,907.419619,False,0.0,False,907.419619 +9bc01c59-3d10-4014-a7a3-6fb702755c5b,OpenAI/gpt-oss-20B,together_ai,qemu-alpine-ssh,491,1346,1837,61.027218,False,0.0,OpenAI/gpt-oss-20B,qemu-alpine-ssh,61.027218,False,0.0,False,61.027218 +b48883c5-a60a-4eb0-83e5-2010edbeb4c6,gemini-2.5-flash,gemini,db-wal-recovery,2120,3093,5213,965.916599,False,0.0,gemini-2.5-flash,db-wal-recovery,965.916599,False,0.0,False,965.916599 +b58fbf32-6dc4-47e9-aed2-5ced4fd17880,zai-org/GLM-4.5-Air-FP8,together_ai,extract-elf,6088,1781,7869,382.428815,False,0.0,zai-org/GLM-4.5-Air-FP8,extract-elf,382.428815,False,0.4,False,382.428815 +3c5b00a7-5aa4-4d35-85ba-0bdaf4de0e53,grok-4-0709,xai,mteb-leaderboard,919,383,1302,187.180532,False,0.0,grok-4-0709,mteb-leaderboard,187.180532,False,0.0,False,187.180532 
+ef49ec7b-fc99-4196-acbf-87725925b51c,claude-sonnet-4-20250514,anthropic,fix-ocaml-gc,36303,19800,56103,3600.63477,False,0.0,claude-sonnet-4-20250514,fix-ocaml-gc,3600.63477,False,0.0,False,3600.63477 +141d9282-e97b-4bf6-9fb8-75b76bc11444,grok-4-0709,xai,cobol-modernization,5294,4761,10055,877.583253,True,1.0,grok-4-0709,cobol-modernization,877.583253,True,0.2,True,877.583253 +ed42c328-f2f6-4c65-b5ca-c0a47bc9ad4d,moonshotai/Kimi-K2-Instruct-0905,together_ai,port-compressor,26556,14930,41486,3601.387825,False,0.0,moonshotai/Kimi-K2-Instruct-0905,port-compressor,3601.387825,False,0.0,False,3601.387825 +f3d56195-48ad-4244-8618-3389b534b8c0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,torch-tensor-parallelism,15190,4138,19328,915.468369,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,torch-tensor-parallelism,915.468369,False,0.0,False,915.468369 +162b9cfd-00af-4ddd-9470-5bb9f62cc793,gpt-5,openai,sqlite-db-truncate,3375,3131,6506,121.735473,False,0.0,gpt-5,sqlite-db-truncate,121.735473,False,0.0,False,121.735473 +34746c8c-c141-4dc3-bc2a-a2a1153fcf22,gpt-5-mini,openai,code-from-image,26304,21655,47959,1201.814291,False,0.0,gpt-5-mini,code-from-image,1201.814291,False,0.0,False,1201.814291 +e76868f1-86b9-47a3-9928-2c714b562908,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,pytorch-model-recovery,25576,7488,33064,924.298777,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,pytorch-model-recovery,924.298777,False,0.0,False,924.298777 +ae90ff68-d2ef-4557-a55e-6e07c1df3428,claude-sonnet-4-20250514,anthropic,tune-mjcf,6965,5190,12155,335.184879,True,1.0,claude-sonnet-4-20250514,tune-mjcf,335.184879,True,0.2,True,335.184879 +fc8c6c13-7325-4e9f-9801-af2bbe1f7dca,claude-opus-4-1-20250805,anthropic,qemu-startup,2757,2565,5322,296.10671,False,0.0,claude-opus-4-1-20250805,qemu-startup,296.10671,False,0.4285714285714285,False,296.10671 
+d1669f60-bd1a-4b26-95b0-3ee7629fb867,gpt-5-mini,openai,configure-git-webserver,2141,2104,4245,388.061256,True,1.0,gpt-5-mini,configure-git-webserver,388.061256,True,0.6,True,388.061256 +d9ce4c6b-953a-4ad8-85bb-fd3bf6881c7c,zai-org/GLM-4.5-Air-FP8,together_ai,install-windows-3.11,9309,4089,13398,131.930154,False,0.0,zai-org/GLM-4.5-Air-FP8,install-windows-3.11,131.930154,False,0.0,False,131.930154 +833951b4-feb0-4d46-84e3-d9e215ee1736,grok-4-0709,xai,prove-plus-comm,2086,1304,3390,329.157309,True,1.0,grok-4-0709,prove-plus-comm,329.157309,True,0.8,True,329.157309 +d90bf36b-518c-42b3-9255-110f25defc72,deepseek-ai/DeepSeek-V3.1,together_ai,hf-model-inference,4169,1565,5734,912.199275,True,1.0,deepseek-ai/DeepSeek-V3.1,hf-model-inference,912.199275,True,0.8,True,912.199275 +5b30fff9-c502-48f3-a49a-859a5626461c,claude-sonnet-4-20250514,anthropic,financial-document-processor,18329,9762,28091,740.840784,False,0.0,claude-sonnet-4-20250514,financial-document-processor,740.840784,False,0.2,False,740.840784 +75fb856c-4ce4-46fa-b750-a34deefde633,grok-code-fast-1,xai,merge-diff-arc-agi-task,9143,3577,12720,845.071644,True,1.0,grok-code-fast-1,merge-diff-arc-agi-task,845.071644,True,0.8,True,845.071644 +de09ea5d-cf82-492e-8481-85787f7476f5,gemini-2.5-flash,gemini,vulnerable-secret,3879,34192,38071,921.406055,False,0.0,gemini-2.5-flash,vulnerable-secret,921.406055,False,0.0,False,921.406055 +85b875e5-39c2-4a37-8a9a-a04fc20b3404,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,install-klee-minimal,11247,3672,14919,904.160487,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,install-klee-minimal,904.160487,False,0.0,False,904.160487 +a6c234d0-7f6e-4d6e-8bf6-5597ad03552d,gpt-5-nano,openai,mteb-leaderboard,22467,35895,58362,3630.082023,False,0.0,gpt-5-nano,mteb-leaderboard,3630.082023,False,0.0,False,3630.082023 
+a30284fc-2f41-4915-a4f1-87cd77e32f83,deepseek-ai/DeepSeek-V3.1,together_ai,dna-insert,12766,8913,21679,360.002678,False,0.0,deepseek-ai/DeepSeek-V3.1,dna-insert,360.002678,False,0.0,False,360.002678 +c3d1d64d-1011-42e9-a4b2-7b14d8caa603,openai/gpt-oss-120b,together_ai,merge-diff-arc-agi-task,4294,2217,6511,154.486227,False,0.0,openai/gpt-oss-120b,merge-diff-arc-agi-task,154.486227,False,0.0,False,154.486227 +cea19262-85af-4737-b330-9a2005df59da,grok-4-0709,xai,break-filter-js-from-html,1864,1580,3444,1210.270347,False,0.0,grok-4-0709,break-filter-js-from-html,1210.270347,False,0.0,False,1210.270347 +924f6034-22de-4b5f-9daa-f5a9151f7a97,OpenAI/gpt-oss-20B,together_ai,code-from-image,269,387,656,64.803339,False,0.0,OpenAI/gpt-oss-20B,code-from-image,64.803339,False,0.0,False,64.803339 +ab3d2779-b0d2-4960-8c7f-5c1c30ee59f4,grok-4-0709,xai,prove-plus-comm,2701,1691,4392,638.25612,True,1.0,grok-4-0709,prove-plus-comm,638.25612,True,0.8,True,638.25612 +97e3683b-adaa-4f8a-87e9-0b43f3566e90,gpt-5-mini,openai,reverse-engineering,17836,16499,34335,2071.097966,False,0.0,gpt-5-mini,reverse-engineering,2071.097966,False,0.0,False,2071.097966 +b66f9625-a8c4-487d-b5f0-9db98fe2da4e,deepseek-ai/DeepSeek-V3.1,together_ai,chess-best-move,17612,5167,22779,410.467958,False,0.0,deepseek-ai/DeepSeek-V3.1,chess-best-move,410.467958,False,0.0,False,410.467958 +2116a837-169f-4d29-a5de-5211a5320707,gpt-5-nano,openai,vulnerable-secret,3506,4121,7627,433.439086,True,1.0,gpt-5-nano,vulnerable-secret,433.439086,True,0.2,True,433.439086 +4cc61104-c20a-40c9-a5c6-db5500ac786f,openai/gpt-oss-120b,together_ai,log-summary-date-ranges,3852,1835,5687,116.518906,False,0.0,openai/gpt-oss-120b,log-summary-date-ranges,116.518906,False,0.0,False,116.518906 +c2385ee8-b2d3-4c06-b743-d5efde999f1b,OpenAI/gpt-oss-20B,together_ai,nginx-request-logging,1251,1235,2486,199.520646,False,0.0,OpenAI/gpt-oss-20B,nginx-request-logging,199.520646,False,0.0,False,199.520646 
+85ccd1dc-8474-4311-8f5b-4d7e22ac6358,moonshotai/Kimi-K2-Instruct-0905,together_ai,distribution-search,20308,19241,39549,1894.392897,False,0.0,moonshotai/Kimi-K2-Instruct-0905,distribution-search,1894.392897,False,0.2,False,1894.392897 +bc86da49-4e7d-43f8-82c2-285937f191ae,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,prove-plus-comm,1502,1260,2762,43.522987,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,prove-plus-comm,43.522987,False,0.0,False,43.522987 +98091376-b51e-4e89-9202-c1f81028fef5,gpt-5-nano,openai,hf-model-inference,2653,2960,5613,902.801198,False,0.0,gpt-5-nano,hf-model-inference,902.801198,False,0.4,False,902.801198 +a5e4f0bd-a43f-4ae8-85fe-0ef66ea804db,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,reverse-engineering,6865,7473,14338,1800.046909,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,reverse-engineering,1800.046909,False,0.0,False,1800.046909 +90c3eb82-fe6b-4932-be3d-0839a4e097c3,grok-4-0709,xai,qemu-alpine-ssh,1563,1154,2717,251.76765,False,0.0,grok-4-0709,qemu-alpine-ssh,251.76765,False,0.0,False,251.76765 +d34bf7d6-1b8c-45c3-bc20-41884ae6f456,gpt-5,openai,path-tracing,10996,7299,18295,1854.889349,False,0.0,gpt-5,path-tracing,1854.889349,False,0.0,False,1854.889349 +7f6f52d4-ea16-4dda-a939-e97125f3c238,moonshotai/Kimi-K2-Instruct-0905,together_ai,polyglot-c-py,8920,10366,19286,900.018897,False,0.0,moonshotai/Kimi-K2-Instruct-0905,polyglot-c-py,900.018897,False,0.0,False,900.018897 +86622a61-f9e8-4d0b-92e1-a181fca4b05f,deepseek-ai/DeepSeek-V3.1,together_ai,port-compressor,51271,34832,86103,758.673041,False,0.0,deepseek-ai/DeepSeek-V3.1,port-compressor,758.673041,False,0.0,False,758.673041 +cb14cfbb-c94d-4084-b37e-911fe14b8535,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,vulnerable-secret,14100,6814,20914,883.723027,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,vulnerable-secret,883.723027,True,0.4,True,883.723027 
+0467048b-359c-4fbc-b476-c0da50e7b624,grok-code-fast-1,xai,winning-avg-corewars,12842,8186,21028,574.616095,False,0.0,grok-code-fast-1,winning-avg-corewars,574.616095,False,0.0,False,574.616095 +b176b07f-ca2d-408e-aa9b-3414a26fc467,grok-4-0709,xai,install-klee-minimal,11189,2172,13361,908.183209,False,0.0,grok-4-0709,install-klee-minimal,908.183209,False,0.0,False,908.183209 +5e4b6f8d-b35e-4793-9f6d-c74b37a9e9e5,grok-code-fast-1,xai,write-compressor,3732,2305,6037,234.927039,False,0.0,grok-code-fast-1,write-compressor,234.927039,False,0.0,False,234.927039 +6e6d6d57-1538-4828-a31e-9f5deec24cd9,gemini-2.5-pro,gemini,db-wal-recovery,10935,4534,15469,903.184844,False,0.0,gemini-2.5-pro,db-wal-recovery,903.184844,False,0.0,False,903.184844 +342a6d2b-e1d9-429a-adf3-5c1287115a2c,grok-code-fast-1,xai,qemu-startup,1391,1187,2578,134.143608,False,0.0,grok-code-fast-1,qemu-startup,134.143608,False,0.0,False,134.143608 +0746c0de-34ec-481b-b047-43df4731a485,claude-opus-4-1-20250805,anthropic,path-tracing,58376,55840,114216,1800.001086,False,0.0,claude-opus-4-1-20250805,path-tracing,1800.001086,False,0.0,False,1800.001086 +2a6609c0-65b1-47f6-abb1-b00fef77a766,claude-opus-4-1-20250805,anthropic,count-dataset-tokens,8306,2608,10914,176.177157,False,0.0,claude-opus-4-1-20250805,count-dataset-tokens,176.177157,False,0.0,False,176.177157 +242d06d7-714c-4f0b-8b18-aea9c13ffaf7,zai-org/GLM-4.5-Air-FP8,together_ai,sqlite-with-gcov,9375,2454,11829,674.239474,False,0.0,zai-org/GLM-4.5-Air-FP8,sqlite-with-gcov,674.239474,False,0.6,False,674.239474 +97fcdb6c-20d8-433f-abd1-c71b85cd7324,deepseek-ai/DeepSeek-V3.1,together_ai,merge-diff-arc-agi-task,18978,11400,30378,387.762671,False,0.0,deepseek-ai/DeepSeek-V3.1,merge-diff-arc-agi-task,387.762671,False,0.2,False,387.762671 +6747793e-147a-4d60-9c25-5b13ee9946ab,zai-org/GLM-4.5-Air-FP8,together_ai,log-summary-date-ranges,7494,2633,10127,76.797332,True,1.0,zai-org/GLM-4.5-Air-FP8,log-summary-date-ranges,76.797332,True,0.8,True,76.797332 
+de8815d3-c935-4a74-a7fe-af4eccf048c6,grok-code-fast-1,xai,count-dataset-tokens,10992,2945,13937,255.548271,False,0.0,grok-code-fast-1,count-dataset-tokens,255.548271,False,0.0,False,255.548271 +8b9d43ac-8bcb-44b7-afc7-0c0e222215f7,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,schemelike-metacircular-eval,24331,24935,49266,1993.440478,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,schemelike-metacircular-eval,1993.440478,False,0.0,False,1993.440478 +455b84ed-16fe-4d1b-8c20-5eded2d7c0f7,deepseek-ai/DeepSeek-V3.1,together_ai,git-leak-recovery,2485,1508,3993,86.361018,True,1.0,deepseek-ai/DeepSeek-V3.1,git-leak-recovery,86.361018,True,0.6,True,86.361018 +6626d907-53dc-493f-a9d5-1c26a5a909a7,gpt-5-nano,openai,openssl-selfsigned-cert,11841,14620,26461,907.278233,False,0.0,gpt-5-nano,openssl-selfsigned-cert,907.278233,False,0.6,False,907.278233 +f52872bf-7858-4875-85b8-93ad80211795,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,run-pdp11-code,5933,1353,7286,141.756492,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,run-pdp11-code,141.756492,False,0.0,False,141.756492 +c8b5b68b-7386-4a2c-8763-7a2078e51065,claude-opus-4-1-20250805,anthropic,large-scale-text-editing,6138,4297,10435,315.583443,False,0.0,claude-opus-4-1-20250805,large-scale-text-editing,315.583443,False,0.6666666666666666,False,315.583443 +b37c917b-c336-4b4c-89b8-2c46c5227376,gemini-2.5-pro,gemini,torch-tensor-parallelism,2038,1413,3451,71.931027,False,0.0,gemini-2.5-pro,torch-tensor-parallelism,71.931027,False,0.0,False,71.931027 +7cc81acf-c15b-4148-bd0e-e82fc04c9447,claude-opus-4-1-20250805,anthropic,dna-insert,7517,4418,11935,145.54479,False,0.0,claude-opus-4-1-20250805,dna-insert,145.54479,False,0.0,False,145.54479 +cdb4125b-aab0-4e5b-ae65-d04645d202ff,claude-opus-4-1-20250805,anthropic,write-compressor,21675,19311,40986,900.00478,False,0.0,claude-opus-4-1-20250805,write-compressor,900.00478,False,0.0,False,900.00478 
+90be352b-40b1-4d3b-aedb-7baca3e0d05f,OpenAI/gpt-oss-20B,together_ai,extract-elf,610,1415,2025,42.176015,False,0.0,OpenAI/gpt-oss-20B,extract-elf,42.176015,False,0.2,False,42.176015 +f50b997e-5703-4006-8c6d-0aa3590f3f6c,claude-sonnet-4-20250514,anthropic,schemelike-metacircular-eval,18312,15127,33439,2400.026386,False,0.0,claude-sonnet-4-20250514,schemelike-metacircular-eval,2400.026386,False,0.0,False,2400.026386 +ad0752fc-e8fb-4647-aefd-387f1b0ffd4f,zai-org/GLM-4.5-Air-FP8,together_ai,build-initramfs-qemu,5510,3077,8587,284.491387,False,0.0,zai-org/GLM-4.5-Air-FP8,build-initramfs-qemu,284.491387,False,0.0,False,284.491387 +855c43de-db94-4716-bd16-447df015a462,gpt-5-nano,openai,install-klee-minimal,4103,1786,5889,908.930039,False,0.0,gpt-5-nano,install-klee-minimal,908.930039,False,0.0,False,908.930039 +0f2bae12-7846-4c95-be69-4cfb7d4428b2,zai-org/GLM-4.5-Air-FP8,together_ai,adaptive-rejection-sampler,14769,12622,27391,900.006828,False,0.0,zai-org/GLM-4.5-Air-FP8,adaptive-rejection-sampler,900.006828,False,0.0,False,900.006828 +9592c3f0-7cc6-4178-9fd4-d5b12a2c7165,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,video-processing,5106,4243,9349,370.757384,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,video-processing,370.757384,False,0.0,False,370.757384 +9c941f45-1745-4981-9daa-7810f42a497a,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,fix-code-vulnerability,17983,8598,26581,900.661841,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,fix-code-vulnerability,900.661841,False,0.4,False,900.661841 +f7f8a619-775b-4943-b928-b62e1f1b0a58,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,bn-fit-modify,16703,8183,24886,766.836765,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,bn-fit-modify,766.836765,False,0.0,False,766.836765 +3b63fa9d-4a69-4516-b287-e02da3b7abbf,gemini-2.5-pro,gemini,largest-eigenval,5696,4533,10229,900.000734,False,0.0,gemini-2.5-pro,largest-eigenval,900.000734,False,0.0,False,900.000734 
+775c5cd7-3231-475c-9df8-285ce29f09b4,claude-opus-4-1-20250805,anthropic,make-mips-interpreter,26107,23325,49432,1800.101062,False,0.0,claude-opus-4-1-20250805,make-mips-interpreter,1800.101062,False,0.0,False,1800.101062 +1a96515e-cd03-4409-b6c9-f5529def8d50,moonshotai/Kimi-K2-Instruct-0905,together_ai,pypi-server,8359,5782,14141,667.874785,False,0.0,moonshotai/Kimi-K2-Instruct-0905,pypi-server,667.874785,False,0.2,False,667.874785 +2b10c226-9066-4427-9cba-04d42132dc88,gpt-5,openai,polyglot-c-py,1441,1685,3126,281.662106,False,0.0,gpt-5,polyglot-c-py,281.662106,False,0.0,False,281.662106 +78e2e2b6-991b-4273-834d-4955844f83ee,grok-code-fast-1,xai,dna-insert,5225,1798,7023,190.506054,False,0.0,grok-code-fast-1,dna-insert,190.506054,False,0.0,False,190.506054 +6bafa982-1d1f-4c1d-8a4a-69a934c4bd71,gpt-5,openai,make-mips-interpreter,14544,32754,47298,1809.734291,False,0.0,gpt-5,make-mips-interpreter,1809.734291,False,0.0,False,1809.734291 +856688c1-a118-4a91-87f9-6d6ceec6479f,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,torch-tensor-parallelism,4384,3184,7568,171.888906,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,torch-tensor-parallelism,171.888906,False,0.0,False,171.888906 +59b5f829-1e37-4cd7-9f05-8ee6c1d89995,claude-sonnet-4-20250514,anthropic,financial-document-processor,20079,6302,26381,486.849086,False,0.0,claude-sonnet-4-20250514,financial-document-processor,486.849086,False,0.2,False,486.849086 +e6b2a61f-ec42-4867-af51-4563257f6369,gpt-5-mini,openai,sparql-university,4146,3235,7381,171.778461,False,0.0,gpt-5-mini,sparql-university,171.778461,False,0.0,False,171.778461 +aa83a5bc-d5b8-40fc-8454-ee84a5f9d40c,OpenAI/gpt-oss-20B,together_ai,sqlite-db-truncate,1148,1872,3020,78.374347,False,0.0,OpenAI/gpt-oss-20B,sqlite-db-truncate,78.374347,False,0.0,False,78.374347 
+26729bb1-d9ff-4d90-bd8d-56932cb0d7b4,claude-sonnet-4-20250514,anthropic,pypi-server,6475,4995,11470,518.259086,True,1.0,claude-sonnet-4-20250514,pypi-server,518.259086,True,0.8,True,518.259086 +405403de-3306-45bb-b4ee-d0b097e5f5b8,gemini-2.5-flash,gemini,reverse-engineering,17468,11725,29193,727.750811,False,0.0,gemini-2.5-flash,reverse-engineering,727.750811,False,0.0,False,727.750811 +8a89b0a1-41f0-451f-a839-06e15dc9bee6,openai/gpt-oss-120b,together_ai,write-compressor,7116,5893,13009,900.034653,False,0.0,openai/gpt-oss-120b,write-compressor,900.034653,False,0.0,False,900.034653 +c12db0fb-59fb-409f-8a42-3e9aa3a207e2,gpt-5-mini,openai,password-recovery,4514,7104,11618,915.622287,False,0.0,gpt-5-mini,password-recovery,915.622287,False,0.0,False,915.622287 +aa63a451-665d-4dd6-84f0-17468df2227d,grok-code-fast-1,xai,fix-code-vulnerability,16849,6584,23433,900.071085,False,0.0,grok-code-fast-1,fix-code-vulnerability,900.071085,False,0.0,False,900.071085 +dfe57fb1-f712-413d-a882-bbabad11d763,claude-opus-4-1-20250805,anthropic,qemu-alpine-ssh,2482,2460,4942,216.84273,True,1.0,claude-opus-4-1-20250805,qemu-alpine-ssh,216.84273,True,0.8571428571428571,True,216.84273 +c3e27173-fb80-472d-8eb0-36b0f157a96e,gpt-5,openai,build-cython-ext,4769,4592,9361,900.031282,False,0.0,gpt-5,build-cython-ext,900.031282,False,0.0,False,900.031282 +06db5486-4be0-4420-a5dd-06196167f155,moonshotai/Kimi-K2-Instruct-0905,together_ai,port-compressor,58299,33417,91716,3618.151075,False,0.0,moonshotai/Kimi-K2-Instruct-0905,port-compressor,3618.151075,False,0.0,False,3618.151075 +f6c2aae5-9a7c-4670-9fcc-51c0a8a8f1f5,gpt-5-mini,openai,password-recovery,7027,5911,12938,900.104368,False,0.0,gpt-5-mini,password-recovery,900.104368,False,0.0,False,900.104368 +46815717-e762-4fac-9c27-cb64ac1e78a0,zai-org/GLM-4.5-Air-FP8,together_ai,sqlite-with-gcov,14035,2871,16906,508.10642,False,0.0,zai-org/GLM-4.5-Air-FP8,sqlite-with-gcov,508.10642,False,0.6,False,508.10642 
+ce6b390c-9cb0-43e2-a581-b7cd2f8ef136,grok-code-fast-1,xai,mteb-leaderboard,930,441,1371,334.936862,False,0.0,grok-code-fast-1,mteb-leaderboard,334.936862,False,0.0,False,334.936862 +c6adf3d9-f323-481f-a15f-75adf828209b,zai-org/GLM-4.5-Air-FP8,together_ai,run-pdp11-code,5517,5102,10619,555.972537,False,0.0,zai-org/GLM-4.5-Air-FP8,run-pdp11-code,555.972537,False,0.0,False,555.972537 +6358a638-898e-470f-8e83-71e5ed5da4e6,gemini-2.5-flash,gemini,polyglot-rust-c,2334,3813,6147,207.448773,False,0.0,gemini-2.5-flash,polyglot-rust-c,207.448773,False,0.0,False,207.448773 +a0982491-253e-488f-9e63-cd1163e81581,gemini-2.5-flash,gemini,circuit-fibsqrt,34068,63885,97953,3605.968766,False,0.0,gemini-2.5-flash,circuit-fibsqrt,3605.968766,False,0.0,False,3605.968766 +d9161c9e-95b9-404e-8e29-5e2806179721,OpenAI/gpt-oss-20B,together_ai,chess-best-move,269,826,1095,35.322172,False,0.0,OpenAI/gpt-oss-20B,chess-best-move,35.322172,False,0.0,False,35.322172 +3d9e25c2-33b9-459f-a20c-ed3e951a6e5e,gemini-2.5-flash,gemini,build-pov-ray,18948,7437,26385,786.053583,False,0.0,gemini-2.5-flash,build-pov-ray,786.053583,False,0.0,False,786.053583 +53057808-b2b1-4c79-b74e-8f5d347f9681,gpt-5-nano,openai,extract-elf,19791,14680,34471,794.774017,True,1.0,gpt-5-nano,extract-elf,794.774017,True,0.2,True,794.774017 +a8203cf0-f2d6-4f59-91da-80b8b0c3076d,grok-code-fast-1,xai,form-filling,7743,5802,13545,310.594237,True,1.0,grok-code-fast-1,form-filling,310.594237,True,0.6,True,310.594237 +51edb7ae-065b-4b87-8b97-ca0ab23d0e58,gemini-2.5-pro,gemini,path-tracing-reverse,6742,5450,12192,867.449715,False,0.0,gemini-2.5-pro,path-tracing-reverse,867.449715,False,0.0,False,867.449715 +aced6db1-10a1-4e04-bd71-1e5fadde2767,zai-org/GLM-4.5-Air-FP8,together_ai,qemu-startup,4225,7551,11776,471.67324,False,0.0,zai-org/GLM-4.5-Air-FP8,qemu-startup,471.67324,False,0.2,False,471.67324 
+e0b03cca-11df-45ca-8229-5dcec2e172ce,OpenAI/gpt-oss-20B,together_ai,feal-differential-cryptanalysis,1736,8239,9975,2439.887236,False,0.0,OpenAI/gpt-oss-20B,feal-differential-cryptanalysis,2439.887236,False,0.0,False,2439.887236 +54efa7af-b259-4c81-8b78-cbd714ec1683,openai/gpt-oss-120b,together_ai,crack-7z-hash,11025,6457,17482,459.091632,False,0.0,openai/gpt-oss-120b,crack-7z-hash,459.091632,False,0.0,False,459.091632 +9adf687d-9e4b-4a7b-a3e3-1a7cedb106ad,gpt-5,openai,constraints-scheduling,3569,1421,4990,330.293856,True,1.0,gpt-5,constraints-scheduling,330.293856,True,0.8571428571428571,True,330.293856 +1f283767-4817-4621-b07d-44965a467ca5,gemini-2.5-pro,gemini,make-doom-for-mips,16809,3985,20794,905.351779,False,0.0,gemini-2.5-pro,make-doom-for-mips,905.351779,False,0.0,False,905.351779 +75785621-085c-42c0-8e81-a311e07ee265,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,fix-code-vulnerability,13584,5644,19228,551.125782,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,fix-code-vulnerability,551.125782,True,0.4,True,551.125782 +3943b20c-5e58-43e3-9076-ccef81806721,gemini-2.5-flash,gemini,vulnerable-secret,7627,8069,15696,900.256038,False,0.0,gemini-2.5-flash,vulnerable-secret,900.256038,False,0.0,False,900.256038 +879cef1a-291d-41ff-8e8b-723d9443e3ba,gpt-5-mini,openai,qemu-alpine-ssh,3954,6891,10845,941.082539,False,0.0,gpt-5-mini,qemu-alpine-ssh,941.082539,False,0.0,False,941.082539 +f6a6cef1-d9d8-4245-8f87-fb3f3f47e48e,gpt-5,openai,chess-best-move,14392,10309,24701,902.477519,False,0.0,gpt-5,chess-best-move,902.477519,False,0.0,False,902.477519 +6338fa2a-0fd2-4c02-935e-2f89055bf215,deepseek-ai/DeepSeek-V3.1,together_ai,sqlite-with-gcov,9338,1425,10763,392.713251,True,1.0,deepseek-ai/DeepSeek-V3.1,sqlite-with-gcov,392.713251,True,0.8,True,392.713251 +055fa93a-23d9-4288-bddb-ee846c467655,gpt-5-mini,openai,wasm-pipeline,6316,6265,12581,322.877102,True,1.0,gpt-5-mini,wasm-pipeline,322.877102,True,0.6,True,322.877102 
+23209f71-78f2-4b62-994b-8000a97430c8,gpt-5-mini,openai,pytorch-model-recovery,6982,7691,14673,402.367435,False,0.0,gpt-5-mini,pytorch-model-recovery,402.367435,False,0.0,False,402.367435 +6bc07c9a-12d2-4db9-95c7-869a58990822,deepseek-ai/DeepSeek-V3.1,together_ai,build-cython-ext,15227,4938,20165,590.375358,False,0.0,deepseek-ai/DeepSeek-V3.1,build-cython-ext,590.375358,False,0.0,False,590.375358 +55fa376c-6a82-481a-9290-ae8db06fb526,claude-sonnet-4-20250514,anthropic,cobol-modernization,6801,4684,11485,429.120695,True,1.0,claude-sonnet-4-20250514,cobol-modernization,429.120695,True,1.0,True,429.120695 +8969b231-a1a2-423b-815e-4bf4cf94ae76,claude-opus-4-1-20250805,anthropic,log-summary-date-ranges,7694,2151,9845,91.415281,True,1.0,claude-opus-4-1-20250805,log-summary-date-ranges,91.415281,True,0.8888888888888888,True,91.415281 +c936df74-0c2a-4003-a8e9-7678b8b1b0ca,deepseek-ai/DeepSeek-V3.1,together_ai,build-cython-ext,20640,5162,25802,795.004501,False,0.0,deepseek-ai/DeepSeek-V3.1,build-cython-ext,795.004501,False,0.0,False,795.004501 +b9a2fb57-47d2-434c-a42e-445d31204299,gpt-5-nano,openai,build-pov-ray,20466,32026,52492,6019.158278,False,0.0,gpt-5-nano,build-pov-ray,6019.158278,False,0.0,False,6019.158278 +6039b297-c1ce-460a-b6c6-492f6a154c92,deepseek-ai/DeepSeek-V3.1,together_ai,large-scale-text-editing,10829,12560,23389,906.150451,False,0.0,deepseek-ai/DeepSeek-V3.1,large-scale-text-editing,906.150451,False,0.0,False,906.150451 +1ae3b58f-28ca-412b-962d-2e29e0651b17,gpt-5,openai,schemelike-metacircular-eval,13061,24609,37670,2411.939929,False,0.0,gpt-5,schemelike-metacircular-eval,2411.939929,False,0.0,False,2411.939929 +dc2307f9-bb45-42a0-a9d9-98cb6da01938,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,prove-plus-comm,5070,5446,10516,913.233448,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,prove-plus-comm,913.233448,False,0.2,False,913.233448 
+b5bf16ef-04e8-4633-8603-da2d849920e5,grok-4-0709,xai,build-initramfs-qemu,5295,4353,9648,900.00104,False,0.0,grok-4-0709,build-initramfs-qemu,900.00104,False,0.0,False,900.00104 +0edb7b99-353c-46c4-a818-5eff90d1df83,gemini-2.5-flash,gemini,distribution-search,44551,50382,94933,3600.053689,False,0.0,gemini-2.5-flash,distribution-search,3600.053689,False,0.0,False,3600.053689 +98cfd85b-4705-4b86-b069-39da3b5dfaf3,gemini-2.5-flash,gemini,model-extraction-relu-logits,2955,5193,8148,904.734862,True,1.0,gemini-2.5-flash,model-extraction-relu-logits,904.734862,True,0.2,True,904.734862 +6d544b26-fd7d-4ef4-8682-50666e5bb0fe,gpt-5-nano,openai,nginx-request-logging,4987,4615,9602,900.667918,False,0.0,gpt-5-nano,nginx-request-logging,900.667918,False,0.0,False,900.667918 +7ed960d8-2fa5-4dda-9db8-a167419401f4,moonshotai/Kimi-K2-Instruct-0905,together_ai,port-compressor,36712,18348,55060,3600.513314,False,0.0,moonshotai/Kimi-K2-Instruct-0905,port-compressor,3600.513314,False,0.0,False,3600.513314 +dfe643eb-2a79-4085-8378-ccdeb30c6a4a,zai-org/GLM-4.5-Air-FP8,together_ai,make-doom-for-mips,18699,6325,25024,905.865221,False,0.0,zai-org/GLM-4.5-Air-FP8,make-doom-for-mips,905.865221,False,0.0,False,905.865221 +f8ba3417-ba0e-4b06-8874-24f5f2e04043,grok-code-fast-1,xai,polyglot-c-py,1203,666,1869,80.655392,False,0.0,grok-code-fast-1,polyglot-c-py,80.655392,False,0.0,False,80.655392 +19f8b9fe-a1fd-40ea-84e1-16d498115663,openai/gpt-oss-120b,together_ai,video-processing,1878,1283,3161,49.491286,False,0.0,openai/gpt-oss-120b,video-processing,49.491286,False,0.0,False,49.491286 +8d3adc34-f187-4fd7-b340-af9148621a19,gpt-5-nano,openai,gpt2-codegolf,1285,1335,2620,102.798116,False,0.0,gpt-5-nano,gpt2-codegolf,102.798116,False,0.0,False,102.798116 +71ba4fdb-231b-4d62-865a-07d941082ef1,gemini-2.5-pro,gemini,bn-fit-modify,18173,4909,23082,1141.810501,False,0.0,gemini-2.5-pro,bn-fit-modify,1141.810501,False,0.0,False,1141.810501 
+6bade9a9-4f4d-4a4c-9f47-b3ac7e6a0601,grok-code-fast-1,xai,path-tracing-reverse,9483,5609,15092,855.003376,False,0.0,grok-code-fast-1,path-tracing-reverse,855.003376,False,0.0,False,855.003376 +bb20ae24-0979-4e17-94fc-16bff66a856e,deepseek-ai/DeepSeek-V3.1,together_ai,pytorch-model-recovery,11482,9029,20511,908.910899,False,0.0,deepseek-ai/DeepSeek-V3.1,pytorch-model-recovery,908.910899,False,0.6,False,908.910899 +6c42b8b7-454e-49ce-a596-ee97d6e4f1a4,openai/gpt-oss-120b,together_ai,count-dataset-tokens,3484,1829,5313,173.911279,False,0.0,openai/gpt-oss-120b,count-dataset-tokens,173.911279,False,0.0,False,173.911279 +cbbab881-3117-4bcd-8627-2375f6e76ba7,openai/gpt-oss-120b,together_ai,install-windows-3.11,1433,794,2227,106.370422,False,0.0,openai/gpt-oss-120b,install-windows-3.11,106.370422,False,0.0,False,106.370422 +7c0bb66a-fee2-44a9-a795-ce9b141e0eab,moonshotai/Kimi-K2-Instruct-0905,together_ai,pytorch-model-cli,16972,13925,30897,941.911409,False,0.0,moonshotai/Kimi-K2-Instruct-0905,pytorch-model-cli,941.911409,False,0.0,False,941.911409 +aba0717e-fae8-4fda-a51c-ad26020e0f94,deepseek-ai/DeepSeek-V3.1,together_ai,polyglot-rust-c,4522,3678,8200,389.171353,False,0.0,deepseek-ai/DeepSeek-V3.1,polyglot-rust-c,389.171353,False,0.0,False,389.171353 +a13e771c-3d30-41a6-b50e-ee754018657c,gemini-2.5-flash,gemini,make-doom-for-mips,6538,4101,10639,236.206561,False,0.0,gemini-2.5-flash,make-doom-for-mips,236.206561,False,0.0,False,236.206561 +0acc683a-338b-457f-b9fb-a7d9f9d733a8,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,fix-git,5695,3029,8724,330.564566,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,fix-git,330.564566,True,1.0,True,330.564566 +0aff3637-463e-403b-80cd-fb97af8c5493,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,install-windows-3.11,16991,10266,27257,1484.71183,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,install-windows-3.11,1484.71183,False,0.0,False,1484.71183 
+b86f0b24-e961-43a0-8712-515abb171646,OpenAI/gpt-oss-20B,together_ai,cobol-modernization,1082,629,1711,914.552962,False,0.0,OpenAI/gpt-oss-20B,cobol-modernization,914.552962,False,0.0,False,914.552962 +cb0a58be-813e-4e99-b67a-5b033eeeeceb,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,train-fasttext,25155,8707,33862,3384.744772,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,train-fasttext,3384.744772,False,0.0,False,3384.744772 +be5c8570-3b01-42c3-8d7b-54cc7e571171,openai/gpt-oss-120b,together_ai,pytorch-model-recovery,22400,19670,42070,900.968414,False,0.0,openai/gpt-oss-120b,pytorch-model-recovery,900.968414,False,0.4,False,900.968414 +36b8b409-f1f9-4459-af0a-3eaa448c3a8b,deepseek-ai/DeepSeek-V3.1,together_ai,break-filter-js-from-html,2467,2578,5045,423.41117,False,0.0,deepseek-ai/DeepSeek-V3.1,break-filter-js-from-html,423.41117,False,0.0,False,423.41117 +17323233-52d7-46e3-9451-02d01b0c8eaa,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,nginx-request-logging,5379,2898,8277,516.70874,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,nginx-request-logging,516.70874,False,0.0,False,516.70874 +352afbf5-0d59-4617-a582-051cc17a0b21,claude-sonnet-4-20250514,anthropic,hf-model-inference,6007,3772,9779,451.788547,False,0.0,claude-sonnet-4-20250514,hf-model-inference,451.788547,False,0.2,False,451.788547 +1ac0e3a1-42a1-44bd-ade4-9d833c77b6e0,OpenAI/gpt-oss-20B,together_ai,sparql-university,546,4775,5321,248.53364,False,0.0,OpenAI/gpt-oss-20B,sparql-university,248.53364,False,0.0,False,248.53364 +25759d41-77bb-486f-abe6-672138e141d6,gemini-2.5-pro,gemini,dna-assembly,9840,4886,14726,657.69496,False,0.0,gemini-2.5-pro,dna-assembly,657.69496,False,0.0,False,657.69496 +911113af-fb85-422f-b760-17ade4dea452,gemini-2.5-flash,gemini,qemu-startup,1207,997,2204,138.383353,True,1.0,gemini-2.5-flash,qemu-startup,138.383353,True,0.2,True,138.383353 
+eedd1016-cf0a-4448-a5fe-876954b7edf1,grok-4-0709,xai,gpt2-codegolf,925,402,1327,192.891878,False,0.0,grok-4-0709,gpt2-codegolf,192.891878,False,0.0,False,192.891878 +eb211567-6114-451a-a756-de4601439e6e,gemini-2.5-pro,gemini,reshard-c4-data,8721,4094,12815,280.366479,False,0.0,gemini-2.5-pro,reshard-c4-data,280.366479,False,0.0,False,280.366479 +8227ce3b-f492-42f1-9e3e-9de905181565,claude-opus-4-1-20250805,anthropic,chess-best-move,8682,7206,15888,672.948844,False,0.0,claude-opus-4-1-20250805,chess-best-move,672.948844,False,0.0,False,672.948844 +56ae61d4-faaa-4104-a6df-1b68bcd4ce7b,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,gpt2-codegolf,1697,2127,3824,338.160201,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,gpt2-codegolf,338.160201,False,0.0,False,338.160201 +8c798de3-08e7-4311-bb2b-40e93f54be4a,grok-code-fast-1,xai,sqlite-with-gcov,8416,1367,9783,205.526773,False,0.0,grok-code-fast-1,sqlite-with-gcov,205.526773,False,0.2,False,205.526773 +0bfd7a2c-b5c7-4d53-b7bf-383e2215e8ff,gpt-5-mini,openai,torch-tensor-parallelism,2782,2398,5180,240.651863,False,0.0,gpt-5-mini,torch-tensor-parallelism,240.651863,False,0.0,False,240.651863 +165cb0e9-b188-4aea-a751-3c7fda1f7a96,gpt-5-nano,openai,make-doom-for-mips,15521,6029,21550,914.385128,False,0.0,gpt-5-nano,make-doom-for-mips,914.385128,False,0.0,False,914.385128 +19665476-e62b-4db5-bd6d-af1f54c2e1be,gpt-5-mini,openai,break-filter-js-from-html,2839,1890,4729,318.149611,False,0.0,gpt-5-mini,break-filter-js-from-html,318.149611,False,0.0,False,318.149611 +a4ba2774-dfd3-4fd5-bfe7-9dff16d353ed,openai/gpt-oss-120b,together_ai,build-cython-ext,9412,7987,17399,900.540037,False,0.0,openai/gpt-oss-120b,build-cython-ext,900.540037,False,0.0,False,900.540037 +5ed3a276-5b7a-477a-88eb-07a907130ad1,moonshotai/Kimi-K2-Instruct-0905,together_ai,password-recovery,5446,6593,12039,752.412577,False,0.0,moonshotai/Kimi-K2-Instruct-0905,password-recovery,752.412577,False,0.2,False,752.412577 
+9239f3c7-d6d0-48ce-9b2c-07953a509501,gpt-5,openai,tune-mjcf,10422,6342,16764,900.000325,False,0.0,gpt-5,tune-mjcf,900.000325,False,0.0,False,900.000325 +15456c0d-f3da-420d-b59d-055c91915343,openai/gpt-oss-120b,together_ai,vulnerable-secret,4414,5397,9811,905.258086,False,0.0,openai/gpt-oss-120b,vulnerable-secret,905.258086,False,0.0,False,905.258086 +b555076b-e922-4a59-aa94-4380848ac011,zai-org/GLM-4.5-Air-FP8,together_ai,filter-js-from-html,14797,15263,30060,949.654966,False,0.0,zai-org/GLM-4.5-Air-FP8,filter-js-from-html,949.654966,False,0.0,False,949.654966 +912644b7-e32f-4db9-8b8b-b482c7609afe,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,reshard-c4-data,4154,2509,6663,408.790879,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,reshard-c4-data,408.790879,False,0.0,False,408.790879 +73737a5a-df7a-4cfb-aa78-6e119fc6b6f2,claude-opus-4-1-20250805,anthropic,merge-diff-arc-agi-task,10145,3119,13264,297.197773,True,1.0,claude-opus-4-1-20250805,merge-diff-arc-agi-task,297.197773,True,0.3333333333333333,True,297.197773 +72dec8b9-abef-4db2-9120-ccd6b100adad,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,fix-ocaml-gc,30389,10243,40632,3740.400352,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,fix-ocaml-gc,3740.400352,False,0.0,False,3740.400352 +b91e580b-5594-4a12-b0ad-2d56402df695,gpt-5-nano,openai,prove-plus-comm,2233,2203,4436,393.440593,True,1.0,gpt-5-nano,prove-plus-comm,393.440593,True,0.4,True,393.440593 +4aeedd1e-a433-4484-82d2-839b24e7c502,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,large-scale-text-editing,5285,2931,8216,177.826574,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,large-scale-text-editing,177.826574,False,0.0,False,177.826574 +662b1d6c-0152-4e79-825b-7abfc4602495,grok-code-fast-1,xai,path-tracing-reverse,2587,1995,4582,187.353112,False,0.0,grok-code-fast-1,path-tracing-reverse,187.353112,False,0.0,False,187.353112 
+8e34bbc2-6a7f-4a81-8622-3a503dc99f9b,gemini-2.5-pro,gemini,hf-model-inference,4175,1605,5780,162.783819,True,1.0,gemini-2.5-pro,hf-model-inference,162.783819,True,0.8,True,162.783819 +19594301-ef2c-47fd-a231-2775535c8bfc,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,large-scale-text-editing,2465,1609,4074,234.161902,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,large-scale-text-editing,234.161902,False,0.0,False,234.161902 +4b4cd1fd-32aa-443d-9e6c-743274ed6410,deepseek-ai/DeepSeek-V3.1,together_ai,chess-best-move,7519,6991,14510,565.509823,False,0.0,deepseek-ai/DeepSeek-V3.1,chess-best-move,565.509823,False,0.0,False,565.509823 +3e9a6a89-ba8b-475d-af05-9fb438faa9d7,deepseek-ai/DeepSeek-V3.1,together_ai,git-leak-recovery,2592,2158,4750,234.1554,False,0.0,deepseek-ai/DeepSeek-V3.1,git-leak-recovery,234.1554,False,0.6,False,234.1554 +7f6f3ec3-d1e6-4cc1-a252-4204d75ebba1,moonshotai/Kimi-K2-Instruct-0905,together_ai,schemelike-metacircular-eval,25247,22920,48167,1933.0568,False,0.0,moonshotai/Kimi-K2-Instruct-0905,schemelike-metacircular-eval,1933.0568,False,0.0,False,1933.0568 +f0be22db-47a1-418c-ba3b-1b00632129f8,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,extract-elf,9100,5917,15017,365.057352,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,extract-elf,365.057352,False,0.6,False,365.057352 +79c5d0ad-8a4e-4474-aee7-00feca5cf772,gpt-5,openai,bn-fit-modify,7360,6760,14120,369.170403,True,1.0,gpt-5,bn-fit-modify,369.170403,True,0.5,True,369.170403 +ebd41487-ff39-4a5c-bedc-c0ed11fd5334,grok-4-0709,xai,break-filter-js-from-html,2022,2076,4098,1200.099427,False,0.0,grok-4-0709,break-filter-js-from-html,1200.099427,False,0.0,False,1200.099427 +b8a2939b-6f15-4946-be28-9acca4d43b30,zai-org/GLM-4.5-Air-FP8,together_ai,fix-code-vulnerability,15695,11250,26945,423.313306,False,0.0,zai-org/GLM-4.5-Air-FP8,fix-code-vulnerability,423.313306,False,0.0,False,423.313306 
+39a66b04-2c14-4dbe-8f26-410f4e360fba,grok-4-0709,xai,log-summary-date-ranges,5542,5076,10618,914.86037,False,0.0,grok-4-0709,log-summary-date-ranges,914.86037,False,0.0,False,914.86037 +021d5735-c51b-41ac-aa15-5f8f320f0b52,gpt-5,openai,git-leak-recovery,7244,9419,16663,900.001982,False,0.0,gpt-5,git-leak-recovery,900.001982,False,0.7142857142857143,False,900.001982 +90878e4b-cb20-4e13-a9b3-9fa20111a1c7,zai-org/GLM-4.5-Air-FP8,together_ai,reverse-engineering,24172,13169,37341,1820.35783,False,0.0,zai-org/GLM-4.5-Air-FP8,reverse-engineering,1820.35783,False,0.0,False,1820.35783 +7bda02fa-0aea-48c7-8d34-9785892edeaf,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,dna-assembly,10825,2692,13517,279.236747,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,dna-assembly,279.236747,False,0.0,False,279.236747 +6fba9039-2326-4468-8474-0e2ddad0ca61,OpenAI/gpt-oss-20B,together_ai,mteb-retrieve,2313,775,3088,171.410954,False,0.0,OpenAI/gpt-oss-20B,mteb-retrieve,171.410954,False,0.0,False,171.410954 +e5fa7fe4-5449-41be-b98f-4cd16b03b822,gemini-2.5-flash,gemini,dna-insert,4743,309,5052,360.961252,False,0.0,gemini-2.5-flash,dna-insert,360.961252,False,0.0,False,360.961252 +432c868e-25b4-4359-95af-dbb34a4b2d7d,claude-opus-4-1-20250805,anthropic,crack-7z-hash,8898,3038,11936,556.88633,True,1.0,claude-opus-4-1-20250805,crack-7z-hash,556.88633,True,0.8888888888888888,True,556.88633 +0e217f67-8ed7-4304-b746-18b4136d6c74,grok-4-0709,xai,cancel-async-tasks,1048,603,1651,104.888625,False,0.0,grok-4-0709,cancel-async-tasks,104.888625,False,0.0,False,104.888625 +ce530fcb-77da-4c3f-b7ed-4696d0fe9d11,claude-opus-4-1-20250805,anthropic,feal-differential-cryptanalysis,41427,44691,86118,1800.001361,False,0.0,claude-opus-4-1-20250805,feal-differential-cryptanalysis,1800.001361,False,0.0,False,1800.001361 
+8636c2e5-4372-491f-bbbb-4e44240a9a64,claude-sonnet-4-20250514,anthropic,merge-diff-arc-agi-task,15854,9202,25056,811.21892,False,0.0,claude-sonnet-4-20250514,merge-diff-arc-agi-task,811.21892,False,0.0,False,811.21892 +464cd2a9-bd38-4f3a-aa3a-88d5711fe689,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,git-leak-recovery,3345,2897,6242,855.601774,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,git-leak-recovery,855.601774,True,1.0,True,855.601774 +261eac40-4ac0-4533-8a6c-1ace515affeb,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,feal-linear-cryptanalysis,8518,6150,14668,748.764668,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,feal-linear-cryptanalysis,748.764668,False,0.0,False,748.764668 +6bd4f311-3a61-44eb-b4a8-f5aed32fac9f,openai/gpt-oss-120b,together_ai,pytorch-model-cli,1451,1304,2755,35.28571,False,0.0,openai/gpt-oss-120b,pytorch-model-cli,35.28571,False,0.0,False,35.28571 +07cc1a7c-2b8e-43a8-b6ae-4236a0062451,claude-sonnet-4-20250514,anthropic,bn-fit-modify,22164,8988,31152,644.112219,True,1.0,claude-sonnet-4-20250514,bn-fit-modify,644.112219,True,0.8,True,644.112219 +3d697603-9e53-456b-91ce-e7619363c6b2,moonshotai/Kimi-K2-Instruct-0905,together_ai,feal-linear-cryptanalysis,14428,10851,25279,2443.52322,False,0.0,moonshotai/Kimi-K2-Instruct-0905,feal-linear-cryptanalysis,2443.52322,False,0.0,False,2443.52322 +972a00a6-60a6-4ec3-928f-199ea182a3d1,OpenAI/gpt-oss-20B,together_ai,install-windows-3.11,14458,31004,45462,1510.922286,False,0.0,OpenAI/gpt-oss-20B,install-windows-3.11,1510.922286,False,0.0,False,1510.922286 +5e318720-a337-45a0-84ab-c68b187d81b7,gemini-2.5-flash,gemini,form-filling,10876,10588,21464,417.453321,False,0.0,gemini-2.5-flash,form-filling,417.453321,False,0.0,False,417.453321 +3081e06c-eebf-4d7c-857a-8dff22e4b6ab,openai/gpt-oss-120b,together_ai,break-filter-js-from-html,2176,533,2709,72.120748,False,0.0,openai/gpt-oss-120b,break-filter-js-from-html,72.120748,False,0.0,False,72.120748 
+cf232c56-6d3c-4d64-bb1d-1c0d5617cabf,gemini-2.5-pro,gemini,polyglot-rust-c,2484,2314,4798,297.3684,False,0.0,gemini-2.5-pro,polyglot-rust-c,297.3684,False,0.0,False,297.3684 +808c2f0d-d7bf-4317-8288-6c2c209c3bf4,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,dna-insert,11092,2714,13806,630.574918,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,dna-insert,630.574918,False,0.0,False,630.574918 +81e97aca-9980-4470-ad77-a7032a80b237,gemini-2.5-flash,gemini,circuit-fibsqrt,37927,87883,125810,3287.977055,False,0.0,gemini-2.5-flash,circuit-fibsqrt,3287.977055,False,0.0,False,3287.977055 +ba624593-febe-42ae-a91f-334a70e333ca,gpt-5,openai,gpt2-codegolf,2647,3264,5911,990.828439,False,0.0,gpt-5,gpt2-codegolf,990.828439,False,0.0,False,990.828439 +7ea95c77-9dbe-4cc8-a350-432681a3394a,claude-opus-4-1-20250805,anthropic,sqlite-db-truncate,7965,4212,12177,278.391312,False,0.0,claude-opus-4-1-20250805,sqlite-db-truncate,278.391312,False,0.125,False,278.391312 +963bc5ef-b5f7-4b98-83fc-c806208a1972,openai/gpt-oss-120b,together_ai,build-cython-ext,7424,3510,10934,902.247733,False,0.0,openai/gpt-oss-120b,build-cython-ext,902.247733,False,0.0,False,902.247733 +952cc713-1d2f-4139-bea0-8b94b5d99e77,gpt-5,openai,password-recovery,4434,5221,9655,900.702539,False,0.0,gpt-5,password-recovery,900.702539,False,0.0,False,900.702539 +ad45fd05-7098-434d-8dea-e086a8e9c296,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,count-dataset-tokens,16381,3828,20209,974.345603,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,count-dataset-tokens,974.345603,False,0.0,False,974.345603 +3c4c26ed-5b4c-4d86-a976-10f834b4aaec,gemini-2.5-flash,gemini,pytorch-model-recovery,17565,12925,30490,640.553611,True,1.0,gemini-2.5-flash,pytorch-model-recovery,640.553611,True,0.2,True,640.553611 
+8c7af778-3908-402a-baa1-d28cff72d4ae,claude-sonnet-4-20250514,anthropic,pytorch-model-recovery,5627,5349,10976,547.444523,True,1.0,claude-sonnet-4-20250514,pytorch-model-recovery,547.444523,True,1.0,True,547.444523 +ed573b9e-4911-4c60-b655-0a1ae0c8be72,gpt-5-nano,openai,cobol-modernization,13127,13527,26654,915.022057,True,1.0,gpt-5-nano,cobol-modernization,915.022057,True,0.4,True,915.022057 +09eb0f32-fe90-4b5f-8ac8-b98abf8824fb,openai/gpt-oss-120b,together_ai,install-klee-minimal,1591,1419,3010,440.05567,False,0.0,openai/gpt-oss-120b,install-klee-minimal,440.05567,False,0.0,False,440.05567 +867ebf83-d157-4139-b30e-b983d7fb42e6,gpt-5,openai,mteb-retrieve,1868,813,2681,118.223015,False,0.0,gpt-5,mteb-retrieve,118.223015,False,0.0,False,118.223015 +0295b364-9818-43be-9fb6-e0a0d3bc0aa5,openai/gpt-oss-120b,together_ai,extract-elf,4145,4967,9112,232.823262,False,0.0,openai/gpt-oss-120b,extract-elf,232.823262,False,0.4,False,232.823262 +a742096c-f8d9-4d04-9d79-c00645ff09a8,grok-4-0709,xai,fix-git,2079,1845,3924,245.989973,True,1.0,grok-4-0709,fix-git,245.989973,True,1.0,True,245.989973 +11ece640-c17f-4af1-88bf-20f086da909f,gpt-5-nano,openai,constraints-scheduling,9621,11268,20889,828.407854,True,1.0,gpt-5-nano,constraints-scheduling,828.407854,True,0.4,True,828.407854 +6046336b-df29-46ae-b9c8-e05953dbc3a5,gpt-5-nano,openai,dna-insert,6518,5009,11527,377.771084,False,0.0,gpt-5-nano,dna-insert,377.771084,False,0.0,False,377.771084 +9b5f79b7-4cae-46fe-af17-9089d001ff9a,gpt-5-nano,openai,model-extraction-relu-logits,1817,2494,4311,175.789692,False,0.0,gpt-5-nano,model-extraction-relu-logits,175.789692,False,0.0,False,175.789692 +e64fccba-96bb-40ba-ace7-289de375f3a4,grok-code-fast-1,xai,fix-code-vulnerability,16678,4176,20854,344.88578,False,0.0,grok-code-fast-1,fix-code-vulnerability,344.88578,False,0.0,False,344.88578 
+6c9765f8-dac9-4171-8457-118327cc7f2a,gpt-5,openai,reshard-c4-data,5839,5547,11386,573.289721,False,0.0,gpt-5,reshard-c4-data,573.289721,False,0.3333333333333333,False,573.289721 +74521611-61df-4af6-aa93-efc2214ec6eb,zai-org/GLM-4.5-Air-FP8,together_ai,pytorch-model-recovery,17758,15878,33636,900.00613,False,0.0,zai-org/GLM-4.5-Air-FP8,pytorch-model-recovery,900.00613,False,0.4,False,900.00613 +d2edec26-1382-4e3a-a570-eb55de09f260,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sqlite-db-truncate,2689,1598,4287,147.813211,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sqlite-db-truncate,147.813211,False,0.0,False,147.813211 +038bb50c-ccdc-4445-b3de-9dd8fc634fb8,gpt-5-nano,openai,hf-model-inference,11973,10580,22553,919.773131,False,0.0,gpt-5-nano,hf-model-inference,919.773131,False,0.4,False,919.773131 +594d949b-996a-455e-a8e9-ed0b73e43599,zai-org/GLM-4.5-Air-FP8,together_ai,model-extraction-relu-logits,1290,1380,2670,1420.756777,False,0.0,zai-org/GLM-4.5-Air-FP8,model-extraction-relu-logits,1420.756777,False,0.2,False,1420.756777 +b7c1c784-0825-45ea-b9b7-ea5f5cdef6ad,gpt-5-nano,openai,git-leak-recovery,3635,4783,8418,901.068127,False,0.0,gpt-5-nano,git-leak-recovery,901.068127,False,0.0,False,901.068127 +2056f705-23a7-4bc5-9a40-e65cd1988135,claude-opus-4-1-20250805,anthropic,polyglot-c-py,13461,9411,22872,823.248162,False,0.0,claude-opus-4-1-20250805,polyglot-c-py,823.248162,False,0.0,False,823.248162 +2eebefca-c851-487b-a2dd-c01eb85cafe2,gpt-5,openai,vulnerable-secret,13266,7810,21076,485.781482,True,1.0,gpt-5,vulnerable-secret,485.781482,True,0.2857142857142857,True,485.781482 +4eb85de0-9c15-4f90-9c4b-8ba3a150dca7,gpt-5,openai,form-filling,9835,11242,21077,541.252707,True,1.0,gpt-5,form-filling,541.252707,True,0.8,True,541.252707 +7415e9c8-bec2-4af8-a5d4-07ecd3aad706,openai/gpt-oss-120b,together_ai,git-leak-recovery,1294,645,1939,62.324182,False,0.0,openai/gpt-oss-120b,git-leak-recovery,62.324182,False,0.2,False,62.324182 
+a1858cc5-7c88-4858-ba02-1e84f2695806,zai-org/GLM-4.5-Air-FP8,together_ai,code-from-image,12939,13513,26452,1224.048082,False,0.0,zai-org/GLM-4.5-Air-FP8,code-from-image,1224.048082,False,0.2,False,1224.048082 +5b83c9c7-c005-4a95-89be-846ae500efc3,gemini-2.5-flash,gemini,gpt2-codegolf,1892,1778,3670,96.970774,False,0.0,gemini-2.5-flash,gpt2-codegolf,96.970774,False,0.0,False,96.970774 +6b160cb1-2a3d-4543-b97d-7e66763896b6,grok-code-fast-1,xai,count-dataset-tokens,11464,4181,15645,773.919599,False,0.0,grok-code-fast-1,count-dataset-tokens,773.919599,False,0.0,False,773.919599 +1ae5f9d3-733a-4930-a440-b86338c76a50,gemini-2.5-flash,gemini,polyglot-c-py,1387,13287,14674,514.70736,False,0.0,gemini-2.5-flash,polyglot-c-py,514.70736,False,0.0,False,514.70736 +e032ad69-aba7-40f8-aee1-d6bd8a312d6c,claude-opus-4-1-20250805,anthropic,make-doom-for-mips,26895,9864,36759,900.90212,False,0.0,claude-opus-4-1-20250805,make-doom-for-mips,900.90212,False,0.0,False,900.90212 +68d1e3dc-8936-4ec9-88d4-b0d3c066bfba,gpt-5,openai,configure-git-webserver,5976,2396,8372,778.7174,True,1.0,gpt-5,configure-git-webserver,778.7174,True,1.0,True,778.7174 +715fe238-1426-430a-a999-ebb63323271c,grok-code-fast-1,xai,regex-log,1371,673,2044,53.534082,False,0.0,grok-code-fast-1,regex-log,53.534082,False,0.0,False,53.534082 +c7b1a0eb-85fd-487d-b75e-75dfec728222,grok-4-0709,xai,configure-git-webserver,4571,872,5443,406.447578,False,0.0,grok-4-0709,configure-git-webserver,406.447578,False,0.0,False,406.447578 +feec636a-19bd-45ec-be2b-47680f32dd44,zai-org/GLM-4.5-Air-FP8,together_ai,configure-git-webserver,4772,2211,6983,321.276225,False,0.0,zai-org/GLM-4.5-Air-FP8,configure-git-webserver,321.276225,False,0.0,False,321.276225 +c6bf4b33-112b-48a8-b43d-2d148873923b,deepseek-ai/DeepSeek-V3.1,together_ai,financial-document-processor,9226,4525,13751,1236.746396,False,0.0,deepseek-ai/DeepSeek-V3.1,financial-document-processor,1236.746396,False,0.0,False,1236.746396 
+30faa2f0-06a9-45ed-b6fe-484514542f19,grok-code-fast-1,xai,build-cython-ext,10913,5958,16871,912.264186,False,0.0,grok-code-fast-1,build-cython-ext,912.264186,False,0.0,False,912.264186 +e0197869-c39e-46de-9997-f166d5f72c42,gpt-5-nano,openai,dna-insert,6781,4083,10864,262.533636,False,0.0,gpt-5-nano,dna-insert,262.533636,False,0.0,False,262.533636 +8193060e-51ff-46e6-8e53-128f96fb32e3,moonshotai/Kimi-K2-Instruct-0905,together_ai,merge-diff-arc-agi-task,14162,7176,21338,900.884919,False,0.0,moonshotai/Kimi-K2-Instruct-0905,merge-diff-arc-agi-task,900.884919,False,0.0,False,900.884919 +ceabc53b-4446-46d0-a5cf-6fe825f4990c,moonshotai/Kimi-K2-Instruct-0905,together_ai,sqlite-with-gcov,11236,2714,13950,720.762943,True,1.0,moonshotai/Kimi-K2-Instruct-0905,sqlite-with-gcov,720.762943,True,0.4,True,720.762943 +7f16a20d-a5f5-49bf-86f9-b0239a6436ed,claude-opus-4-1-20250805,anthropic,crack-7z-hash,7666,4889,12555,356.500901,True,1.0,claude-opus-4-1-20250805,crack-7z-hash,356.500901,True,0.8888888888888888,True,356.500901 +57e04059-2ca8-488a-b431-77f66ff880e9,moonshotai/Kimi-K2-Instruct-0905,together_ai,write-compressor,10392,11402,21794,782.580816,False,0.0,moonshotai/Kimi-K2-Instruct-0905,write-compressor,782.580816,False,0.0,False,782.580816 +e14921d8-3dcc-4de4-8966-81852fc9304b,moonshotai/Kimi-K2-Instruct-0905,together_ai,form-filling,9373,7886,17259,676.929552,True,1.0,moonshotai/Kimi-K2-Instruct-0905,form-filling,676.929552,True,0.8,True,676.929552 +35888e4c-8afd-4d05-b235-7304a4b4ccce,grok-code-fast-1,xai,qemu-startup,1020,757,1777,502.770008,False,0.0,grok-code-fast-1,qemu-startup,502.770008,False,0.0,False,502.770008 +87f64194-cdc8-4a5d-a270-d0f7374ccb12,gpt-5-mini,openai,dna-assembly,14778,14666,29444,737.071645,False,0.0,gpt-5-mini,dna-assembly,737.071645,False,0.0,False,737.071645 
+9eedf61d-f886-4eb5-a63e-ab796ff7ebc0,gemini-2.5-flash,gemini,pytorch-model-recovery,17464,15163,32627,900.953317,False,0.0,gemini-2.5-flash,pytorch-model-recovery,900.953317,False,0.2,False,900.953317 +c9ec3100-e9e8-44d8-ae46-2e5bc7dfb6af,gpt-5-nano,openai,regex-log,4035,5003,9038,2352.316519,False,0.0,gpt-5-nano,regex-log,2352.316519,False,0.2,False,2352.316519 +75b1b712-5faf-4445-898a-0e9c29bb719b,gpt-5-mini,openai,largest-eigenval,13225,10412,23637,902.54655,False,0.0,gpt-5-mini,largest-eigenval,902.54655,False,0.0,False,902.54655 +f704e922-ad3d-4cba-a54a-c1cbda8203dc,claude-opus-4-1-20250805,anthropic,cobol-modernization,7598,4509,12107,435.361757,True,1.0,claude-opus-4-1-20250805,cobol-modernization,435.361757,True,0.875,True,435.361757 +2bdb51b4-7f78-4e61-8138-6f4fc392d3ca,gemini-2.5-flash,gemini,break-filter-js-from-html,1705,2211,3916,119.978262,False,0.0,gemini-2.5-flash,break-filter-js-from-html,119.978262,False,0.0,False,119.978262 +235e0bdf-a8ec-4ba4-9444-3ea33cdb0071,moonshotai/Kimi-K2-Instruct-0905,together_ai,fix-git,4263,3324,7587,897.086075,True,1.0,moonshotai/Kimi-K2-Instruct-0905,fix-git,897.086075,True,1.0,True,897.086075 +c083db2f-7c25-457c-af72-a1a38065746f,claude-sonnet-4-20250514,anthropic,model-extraction-relu-logits,6870,6502,13372,718.960034,False,0.0,claude-sonnet-4-20250514,model-extraction-relu-logits,718.960034,False,0.0,False,718.960034 +456e82cb-028e-40a4-b978-e5aa0e6ef84d,claude-opus-4-1-20250805,anthropic,pytorch-model-cli,14685,5272,19957,379.893183,False,0.0,claude-opus-4-1-20250805,pytorch-model-cli,379.893183,False,0.4285714285714285,False,379.893183 +0358c863-4758-404c-a034-94d684264187,zai-org/GLM-4.5-Air-FP8,together_ai,wasm-pipeline,5674,4543,10217,1033.663767,False,0.0,zai-org/GLM-4.5-Air-FP8,wasm-pipeline,1033.663767,False,0.2,False,1033.663767 +a9479dd6-30e5-445c-a333-616e0e505c1f,gpt-5-mini,openai,sparql-university,5398,3327,8725,263.766192,False,0.0,gpt-5-mini,sparql-university,263.766192,False,0.0,False,263.766192 
+ea8b6f01-a531-4a8f-96ba-24eaa49ef8ab,gpt-5,openai,polyglot-c-py,1547,1431,2978,663.855689,False,0.0,gpt-5,polyglot-c-py,663.855689,False,0.0,False,663.855689 +2142963b-efa7-41e0-9d18-74da4e6db6d7,gpt-5-nano,openai,chess-best-move,1268,888,2156,92.702976,False,0.0,gpt-5-nano,chess-best-move,92.702976,False,0.0,False,92.702976 +c8c67d8c-d6a3-4f00-9d2f-447353538b74,deepseek-ai/DeepSeek-V3.1,together_ai,code-from-image,16630,8760,25390,1225.531146,False,0.0,deepseek-ai/DeepSeek-V3.1,code-from-image,1225.531146,False,0.6,False,1225.531146 +595d1939-2424-4366-bd42-beedd35b8b32,moonshotai/Kimi-K2-Instruct-0905,together_ai,pypi-server,5476,4351,9827,793.433323,True,1.0,moonshotai/Kimi-K2-Instruct-0905,pypi-server,793.433323,True,0.2,True,793.433323 +efac70da-c352-4c81-bd24-539ad85b4ac4,gpt-5-nano,openai,filter-js-from-html,5417,5632,11049,407.989321,False,0.0,gpt-5-nano,filter-js-from-html,407.989321,False,0.0,False,407.989321 +ed22019e-8b53-423e-87c8-4dd2ce68fba2,grok-4-0709,xai,feal-linear-cryptanalysis,3577,1589,5166,2322.54027,False,0.0,grok-4-0709,feal-linear-cryptanalysis,2322.54027,False,0.0,False,2322.54027 +70adc40b-624b-4249-b8c4-71265ef42d2a,OpenAI/gpt-oss-20B,together_ai,break-filter-js-from-html,1216,2081,3297,247.076007,False,0.0,OpenAI/gpt-oss-20B,break-filter-js-from-html,247.076007,False,0.0,False,247.076007 +030c60e1-980a-414e-9370-01d3a19ec68a,moonshotai/Kimi-K2-Instruct-0905,together_ai,password-recovery,6708,6343,13051,913.513438,False,0.0,moonshotai/Kimi-K2-Instruct-0905,password-recovery,913.513438,False,0.2,False,913.513438 +eccf9b86-76f0-463e-9749-36dcfa9063cc,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,reshard-c4-data,8373,4031,12404,480.301997,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,reshard-c4-data,480.301997,False,0.0,False,480.301997 
+59a45a77-b0fc-4bd8-8fde-4f2435ccc621,claude-opus-4-1-20250805,anthropic,password-recovery,7111,3949,11060,667.830922,True,1.0,claude-opus-4-1-20250805,password-recovery,667.830922,True,0.5555555555555556,True,667.830922 +6e206e4c-f793-41da-974d-28d2cb49d0db,openai/gpt-oss-120b,together_ai,qemu-startup,2148,2323,4471,166.744352,False,0.0,openai/gpt-oss-120b,qemu-startup,166.744352,False,0.0,False,166.744352 +4c648cc5-b1de-4b3b-9bbf-e5f67ad51931,gpt-5-mini,openai,hf-model-inference,2646,2167,4813,255.82004,True,1.0,gpt-5-mini,hf-model-inference,255.82004,True,0.8,True,255.82004 +b32993da-a8b6-42d7-8e0f-bfcdd006fd9e,claude-opus-4-1-20250805,anthropic,merge-diff-arc-agi-task,7411,1861,9272,917.497024,False,0.0,claude-opus-4-1-20250805,merge-diff-arc-agi-task,917.497024,False,0.3333333333333333,False,917.497024 +468d8c01-08f0-45ea-8cf3-e912e6067987,claude-opus-4-1-20250805,anthropic,sanitize-git-repo,7155,2612,9767,900.00212,False,0.0,claude-opus-4-1-20250805,sanitize-git-repo,900.00212,False,0.0,False,900.00212 +339fe229-79dd-4d78-9ca7-79eb2cc78b90,grok-code-fast-1,xai,tune-mjcf,7012,6121,13133,868.599159,False,0.0,grok-code-fast-1,tune-mjcf,868.599159,False,0.4,False,868.599159 +d9238b7c-668e-4609-b5e5-0348a0f792f4,deepseek-ai/DeepSeek-V3.1,together_ai,code-from-image,4173,3700,7873,163.461342,False,0.0,deepseek-ai/DeepSeek-V3.1,code-from-image,163.461342,False,0.6,False,163.461342 +030f820b-00df-4821-9836-bda4f095663d,deepseek-ai/DeepSeek-V3.1,together_ai,git-leak-recovery,2707,2246,4953,143.5472,True,1.0,deepseek-ai/DeepSeek-V3.1,git-leak-recovery,143.5472,True,0.6,True,143.5472 +754df405-0db1-4e46-807b-959f2fa530a7,openai/gpt-oss-120b,together_ai,reverse-engineering,12492,10353,22845,1801.939504,False,0.0,openai/gpt-oss-120b,reverse-engineering,1801.939504,False,0.2,False,1801.939504 
+852834ef-c68a-46c2-8b92-2bc2682619cd,deepseek-ai/DeepSeek-V3.1,together_ai,code-from-image,23360,13835,37195,1137.019798,True,1.0,deepseek-ai/DeepSeek-V3.1,code-from-image,1137.019798,True,0.6,True,1137.019798 +84cac82c-cf22-42ea-a3e6-aff009f532ce,deepseek-ai/DeepSeek-V3.1,together_ai,fix-git,7018,3260,10278,198.331857,True,1.0,deepseek-ai/DeepSeek-V3.1,fix-git,198.331857,True,0.8,True,198.331857 +97130dad-35ce-4177-bf17-58dbc95f4658,zai-org/GLM-4.5-Air-FP8,together_ai,nginx-request-logging,6022,4175,10197,75.09853,True,1.0,zai-org/GLM-4.5-Air-FP8,nginx-request-logging,75.09853,True,1.0,True,75.09853 +e6b7f583-3355-41c2-9414-dcfe10720c51,gpt-5-nano,openai,crack-7z-hash,4227,2479,6706,171.686959,False,0.0,gpt-5-nano,crack-7z-hash,171.686959,False,0.0,False,171.686959 +45b52d22-2f0f-4e1f-8049-351aa0cf95e2,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,gpt2-codegolf,2394,2368,4762,276.500254,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,gpt2-codegolf,276.500254,False,0.0,False,276.500254 +930aa83e-b2de-4276-beb6-732ac8381ff5,grok-4-0709,xai,constraints-scheduling,3603,1252,4855,666.853623,True,1.0,grok-4-0709,constraints-scheduling,666.853623,True,0.8,True,666.853623 +3112ec9d-e5e1-4832-a612-c18f38016c19,zai-org/GLM-4.5-Air-FP8,together_ai,qemu-alpine-ssh,7877,8849,16726,916.004436,False,0.0,zai-org/GLM-4.5-Air-FP8,qemu-alpine-ssh,916.004436,False,0.0,False,916.004436 +73134e5c-f967-4229-80a9-1c8da840cbec,zai-org/GLM-4.5-Air-FP8,together_ai,write-compressor,11443,13048,24491,900.281979,False,0.0,zai-org/GLM-4.5-Air-FP8,write-compressor,900.281979,False,0.0,False,900.281979 +c3130136-d5b3-4e6c-927c-b0a70c24d317,claude-sonnet-4-20250514,anthropic,build-pmars,16622,3797,20419,314.732475,True,1.0,claude-sonnet-4-20250514,build-pmars,314.732475,True,0.6,True,314.732475 
+63a03bce-761e-4b8f-86a8-587a34f7098d,deepseek-ai/DeepSeek-V3.1,together_ai,winning-avg-corewars,13327,11757,25084,650.885878,False,0.0,deepseek-ai/DeepSeek-V3.1,winning-avg-corewars,650.885878,False,0.0,False,650.885878 +05446873-ba91-483b-a235-2e70ce73e0b3,claude-sonnet-4-20250514,anthropic,install-klee-minimal,25999,4317,30316,900.508385,False,0.0,claude-sonnet-4-20250514,install-klee-minimal,900.508385,False,0.0,False,900.508385 +d613cc38-4fa2-498a-9974-7a45106c6241,gemini-2.5-flash,gemini,run-pdp11-code,11099,8180,19279,1009.787953,False,0.0,gemini-2.5-flash,run-pdp11-code,1009.787953,False,0.0,False,1009.787953 +6b7dbe2b-f483-47dc-8f83-cce61d6b8e92,openai/gpt-oss-120b,together_ai,password-recovery,1245,921,2166,367.672835,False,0.0,openai/gpt-oss-120b,password-recovery,367.672835,False,0.2,False,367.672835 +385d4f26-dc27-4699-b932-3d2166191eb9,claude-opus-4-1-20250805,anthropic,write-compressor,3553,1549,5102,1416.71387,False,0.0,claude-opus-4-1-20250805,write-compressor,1416.71387,False,0.0,False,1416.71387 +b5995c9d-2352-41c7-b551-3aef028555e1,gpt-5-nano,openai,largest-eigenval,4806,4088,8894,179.300111,False,0.0,gpt-5-nano,largest-eigenval,179.300111,False,0.0,False,179.300111 +ed7b84dd-bba2-4bea-9a52-6e17019578f4,grok-4-0709,xai,configure-git-webserver,4491,660,5151,336.824078,False,0.0,grok-4-0709,configure-git-webserver,336.824078,False,0.0,False,336.824078 +14b76156-e9d7-499a-bf38-fab27278a18e,gpt-5-nano,openai,schemelike-metacircular-eval,6584,12881,19465,2401.299745,False,0.0,gpt-5-nano,schemelike-metacircular-eval,2401.299745,False,0.2,False,2401.299745 +96560608-d32c-4317-96fd-0db05f68b7ff,claude-sonnet-4-20250514,anthropic,cancel-async-tasks,3036,3040,6076,429.56147,False,0.0,claude-sonnet-4-20250514,cancel-async-tasks,429.56147,False,0.8,False,429.56147 
+c35e2f16-6867-405d-b240-2ab7d3bfe85a,claude-opus-4-1-20250805,anthropic,torch-tensor-parallelism,2269,1603,3872,45.158359,False,0.0,claude-opus-4-1-20250805,torch-tensor-parallelism,45.158359,False,0.0,False,45.158359 +7b7d890c-264c-498b-b2ae-0e82d054f32f,grok-4-0709,xai,cobol-modernization,3317,1534,4851,900.722841,False,0.0,grok-4-0709,cobol-modernization,900.722841,False,0.2,False,900.722841 +5978e7ea-58bd-4d7d-985d-f47af32519db,claude-opus-4-1-20250805,anthropic,path-tracing,26044,20941,46985,1804.230985,False,0.0,claude-opus-4-1-20250805,path-tracing,1804.230985,False,0.0,False,1804.230985 +87d3e970-3208-439e-844d-357a468e3946,zai-org/GLM-4.5-Air-FP8,together_ai,sparql-university,6684,3478,10162,146.77914,False,0.0,zai-org/GLM-4.5-Air-FP8,sparql-university,146.77914,False,0.0,False,146.77914 +b681f844-aaf0-4c6c-a787-f96ef4612a72,openai/gpt-oss-120b,together_ai,password-recovery,1497,1029,2526,107.874483,True,1.0,openai/gpt-oss-120b,password-recovery,107.874483,True,0.2,True,107.874483 +3e00f1f2-f771-4354-9550-ab94b95060d0,claude-opus-4-1-20250805,anthropic,video-processing,3821,3121,6942,298.359356,False,0.0,claude-opus-4-1-20250805,video-processing,298.359356,False,0.0,False,298.359356 +400e8377-a400-41c1-b54c-bd2768af7556,gemini-2.5-flash,gemini,path-tracing,2361,7058,9419,346.891061,False,0.0,gemini-2.5-flash,path-tracing,346.891061,False,0.0,False,346.891061 +718354f9-1540-47bb-a84e-afad16a8902d,gpt-5-nano,openai,circuit-fibsqrt,77745,43772,121517,3606.240286,False,0.0,gpt-5-nano,circuit-fibsqrt,3606.240286,False,0.0,False,3606.240286 +4f236017-9f74-4364-81f7-7d15610c8391,gpt-5-nano,openai,sqlite-db-truncate,6569,7936,14505,907.407995,False,0.0,gpt-5-nano,sqlite-db-truncate,907.407995,False,0.0,False,907.407995 +5403e91f-05ca-4b8e-a964-3c117c60bc5f,deepseek-ai/DeepSeek-V3.1,together_ai,fix-ocaml-gc,25984,8796,34780,3705.862011,False,0.0,deepseek-ai/DeepSeek-V3.1,fix-ocaml-gc,3705.862011,False,0.0,False,3705.862011 
+dcb775a5-e9a4-4a7b-8e39-80d43e4438ed,deepseek-ai/DeepSeek-V3.1,together_ai,log-summary-date-ranges,8720,3298,12018,288.142412,True,1.0,deepseek-ai/DeepSeek-V3.1,log-summary-date-ranges,288.142412,True,0.4,True,288.142412 +19665595-97d4-435b-b595-bcf3f2948477,gpt-5-mini,openai,torch-tensor-parallelism,3447,3558,7005,186.701528,False,0.0,gpt-5-mini,torch-tensor-parallelism,186.701528,False,0.0,False,186.701528 +00814575-1545-4f5c-b500-9745e3084412,gemini-2.5-pro,gemini,mteb-retrieve,2161,1194,3355,169.302086,False,0.0,gemini-2.5-pro,mteb-retrieve,169.302086,False,0.0,False,169.302086 +1629cd15-cab0-4e66-ac31-b62e391a69e0,gemini-2.5-pro,gemini,constraints-scheduling,4864,2661,7525,476.403029,True,1.0,gemini-2.5-pro,constraints-scheduling,476.403029,True,1.0,True,476.403029 +a77a7663-92ac-4404-8432-dfae4a94f971,gpt-5,openai,vulnerable-secret,6767,4722,11489,923.786604,False,0.0,gpt-5,vulnerable-secret,923.786604,False,0.2857142857142857,False,923.786604 +ef80d46c-70a9-4a33-a02f-15c011616e29,grok-code-fast-1,xai,form-filling,3920,2734,6654,204.388012,False,0.0,grok-code-fast-1,form-filling,204.388012,False,0.6,False,204.388012 +43edcb06-f3dd-413a-8283-39e6fc5f680e,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,circuit-fibsqrt,33677,40913,74590,3615.228631,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,circuit-fibsqrt,3615.228631,False,0.0,False,3615.228631 +a2d67299-86f3-451a-9c1d-48d3e8068626,claude-opus-4-1-20250805,anthropic,dna-insert,7629,5867,13496,360.012105,False,0.0,claude-opus-4-1-20250805,dna-insert,360.012105,False,0.0,False,360.012105 +1eb170f7-f27f-4f59-b7a7-2927e1ce68c8,claude-sonnet-4-20250514,anthropic,constraints-scheduling,6474,4750,11224,477.372967,True,1.0,claude-sonnet-4-20250514,constraints-scheduling,477.372967,True,1.0,True,477.372967 +3302e888-31c8-4c5e-ac13-658696faaac2,claude-opus-4-1-20250805,anthropic,form-filling,7896,5924,13820,644.983843,True,1.0,claude-opus-4-1-20250805,form-filling,644.983843,True,1.0,True,644.983843 
+9b6eac77-21b8-4a70-8b9a-77657693efd6,OpenAI/gpt-oss-20B,together_ai,pytorch-model-cli,667,713,1380,125.023286,False,0.0,OpenAI/gpt-oss-20B,pytorch-model-cli,125.023286,False,0.0,False,125.023286 +68b352f1-22f0-4fcb-896a-4febdd537cc7,claude-opus-4-1-20250805,anthropic,reshard-c4-data,8739,7737,16476,599.941002,False,0.0,claude-opus-4-1-20250805,reshard-c4-data,599.941002,False,0.0,False,599.941002 +2442d7a0-f4d3-4d39-8e66-328c910d1a6e,deepseek-ai/DeepSeek-V3.1,together_ai,make-doom-for-mips,22424,3803,26227,806.154215,False,0.0,deepseek-ai/DeepSeek-V3.1,make-doom-for-mips,806.154215,False,0.0,False,806.154215 +c3be3873-dfd1-44ad-a02f-df4888b8fd32,claude-opus-4-1-20250805,anthropic,circuit-fibsqrt,18875,16866,35741,1077.280833,False,0.0,claude-opus-4-1-20250805,circuit-fibsqrt,1077.280833,False,0.0,False,1077.280833 +2e05751a-d205-45d1-809f-f0b08d5c960f,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,dna-assembly,14185,9680,23865,756.249183,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,dna-assembly,756.249183,False,0.0,False,756.249183 +c1a1c713-f23f-4ecb-8c5e-65013e98ff1a,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,write-compressor,9577,9746,19323,904.311186,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,write-compressor,904.311186,False,0.0,False,904.311186 +2442eec9-28bf-4b5f-9032-3db54b84e24b,gemini-2.5-flash,gemini,gpt2-codegolf,2375,5007,7382,563.656472,False,0.0,gemini-2.5-flash,gpt2-codegolf,563.656472,False,0.0,False,563.656472 +ff0f19ea-58f9-40d2-8a69-eb756626c9ed,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,openssl-selfsigned-cert,3846,2516,6362,181.191757,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,openssl-selfsigned-cert,181.191757,False,0.4,False,181.191757 +76ab802c-6b26-4ea4-b150-61ae2d8e1a36,grok-4-0709,xai,path-tracing,3982,3187,7169,1860.298814,False,0.0,grok-4-0709,path-tracing,1860.298814,False,0.0,False,1860.298814 
+5cb189ea-a335-41c5-aeb2-a025021a6aae,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,constraints-scheduling,5949,4396,10345,391.861958,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,constraints-scheduling,391.861958,True,1.0,True,391.861958 +3be4d6fa-1851-4b67-ae8f-2f5fdd5b496e,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,distribution-search,7467,5810,13277,2071.035792,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,distribution-search,2071.035792,False,0.0,False,2071.035792 +b5e793d0-8715-420f-a90b-a7c1cf8cec6a,gpt-5,openai,largest-eigenval,8588,7202,15790,725.332873,False,0.0,gpt-5,largest-eigenval,725.332873,False,0.0,False,725.332873 +1f312ef1-eb47-4a2c-bd3e-73e67b672605,claude-opus-4-1-20250805,anthropic,count-dataset-tokens,12352,2475,14827,306.541506,False,0.0,claude-opus-4-1-20250805,count-dataset-tokens,306.541506,False,0.0,False,306.541506 +dd3f0803-762c-4bb7-a858-de4dec4dd99e,zai-org/GLM-4.5-Air-FP8,together_ai,dna-assembly,18182,7560,25742,721.467656,False,0.0,zai-org/GLM-4.5-Air-FP8,dna-assembly,721.467656,False,0.0,False,721.467656 +06c76a95-74e3-4d5c-adb3-81dcd76bca94,zai-org/GLM-4.5-Air-FP8,together_ai,tune-mjcf,9452,10448,19900,1006.430859,False,0.0,zai-org/GLM-4.5-Air-FP8,tune-mjcf,1006.430859,False,0.0,False,1006.430859 +30451bf1-2fdc-42ae-8c04-d97cabf911d8,gpt-5,openai,reshard-c4-data,1781,4730,6511,388.870852,True,1.0,gpt-5,reshard-c4-data,388.870852,True,0.3333333333333333,True,388.870852 +4972d768-75e8-4e91-ab75-f65fe5b0eb43,zai-org/GLM-4.5-Air-FP8,together_ai,train-fasttext,24663,10895,35558,2870.975858,True,1.0,zai-org/GLM-4.5-Air-FP8,train-fasttext,2870.975858,True,0.2,True,2870.975858 +27fdaa4e-3636-4e9c-b53a-51d99fb32f46,zai-org/GLM-4.5-Air-FP8,together_ai,dna-insert,13146,3904,17050,361.682963,False,0.0,zai-org/GLM-4.5-Air-FP8,dna-insert,361.682963,False,0.0,False,361.682963 
+8a684b88-63bb-4b0a-b5b4-0ef90a464515,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sparql-university,11601,3047,14648,330.063359,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sparql-university,330.063359,False,0.0,False,330.063359 +38d9a557-1971-44a5-8cad-88d2169cbc85,zai-org/GLM-4.5-Air-FP8,together_ai,mteb-leaderboard,8301,8815,17116,2124.028368,False,0.0,zai-org/GLM-4.5-Air-FP8,mteb-leaderboard,2124.028368,False,0.0,False,2124.028368 +0701bd50-d081-4d54-941e-570a9d051743,zai-org/GLM-4.5-Air-FP8,together_ai,git-leak-recovery,3133,4397,7530,109.87425,True,1.0,zai-org/GLM-4.5-Air-FP8,git-leak-recovery,109.87425,True,0.8,True,109.87425 +b557d6c8-aaa1-445d-b152-788af54e5051,claude-opus-4-1-20250805,anthropic,nginx-request-logging,4968,1870,6838,233.265661,True,1.0,claude-opus-4-1-20250805,nginx-request-logging,233.265661,True,1.0,True,233.265661 +27d7ccc7-7795-45a2-85aa-3e3d4ac91d6e,openai/gpt-oss-120b,together_ai,git-leak-recovery,1186,1178,2364,72.803329,False,0.0,openai/gpt-oss-120b,git-leak-recovery,72.803329,False,0.2,False,72.803329 +183a1834-b322-401c-a75d-c458788d00a9,claude-sonnet-4-20250514,anthropic,polyglot-rust-c,9770,10848,20618,900.535424,False,0.0,claude-sonnet-4-20250514,polyglot-rust-c,900.535424,False,0.0,False,900.535424 +c0d80f87-7f30-487a-b3e2-5766600f742f,gpt-5,openai,code-from-image,24219,7894,32113,567.152112,True,1.0,gpt-5,code-from-image,567.152112,True,0.4,True,567.152112 +6e6f8980-02c0-4217-8bce-89647196b466,zai-org/GLM-4.5-Air-FP8,together_ai,form-filling,6106,5729,11835,371.876728,True,1.0,zai-org/GLM-4.5-Air-FP8,form-filling,371.876728,True,0.8,True,371.876728 +259414e9-193c-440f-9f29-b462489cd762,moonshotai/Kimi-K2-Instruct-0905,together_ai,largest-eigenval,6632,5752,12384,910.658507,False,0.0,moonshotai/Kimi-K2-Instruct-0905,largest-eigenval,910.658507,False,0.2,False,910.658507 
+4a120157-5af1-4313-9897-288c67b8d002,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,financial-document-processor,10877,2031,12908,641.888099,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,financial-document-processor,641.888099,False,0.0,False,641.888099 +2be54584-afd4-4ae8-add6-38e332bbf922,claude-opus-4-1-20250805,anthropic,path-tracing-reverse,33858,25748,59606,1810.128392,False,0.0,claude-opus-4-1-20250805,path-tracing-reverse,1810.128392,False,0.0,False,1810.128392 +4d89ef5c-73d5-424e-8e70-5aaa54ca72be,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-pov-ray,13214,6376,19590,974.964822,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-pov-ray,974.964822,False,0.2,False,974.964822 +9aef684a-e4bd-405a-9932-d4ca61213515,OpenAI/gpt-oss-20B,together_ai,sqlite-with-gcov,3386,17313,20699,911.820457,False,0.0,OpenAI/gpt-oss-20B,sqlite-with-gcov,911.820457,False,0.0,False,911.820457 +c7d2275b-eda7-4853-884c-24d599ad6089,deepseek-ai/DeepSeek-V3.1,together_ai,reverse-engineering,11383,6954,18337,513.760676,False,0.0,deepseek-ai/DeepSeek-V3.1,reverse-engineering,513.760676,False,0.2,False,513.760676 +3d272d79-ba69-4495-b298-831b4c4ce340,zai-org/GLM-4.5-Air-FP8,together_ai,bn-fit-modify,19723,12254,31977,657.684522,False,0.0,zai-org/GLM-4.5-Air-FP8,bn-fit-modify,657.684522,False,0.0,False,657.684522 +fd489c11-113e-4ee8-8d43-c1f7cdb44481,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,configure-git-webserver,6527,2196,8723,434.918866,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,configure-git-webserver,434.918866,True,0.6,True,434.918866 +b7d75e8f-c633-4f53-98d9-e27efa6b0f9e,gemini-2.5-flash,gemini,configure-git-webserver,5634,1792,7426,437.069834,False,0.0,gemini-2.5-flash,configure-git-webserver,437.069834,False,0.0,False,437.069834 +1d5bee34-f592-45be-aadb-8c81bc0d8f11,grok-4-0709,xai,qemu-startup,1920,2867,4787,902.780115,False,0.0,grok-4-0709,qemu-startup,902.780115,False,0.4,False,902.780115 
+8fc5545b-8b8e-4763-9d14-dea0c3e11c17,claude-opus-4-1-20250805,anthropic,train-fasttext,53986,17299,71285,3605.320573,False,0.0,claude-opus-4-1-20250805,train-fasttext,3605.320573,False,0.2857142857142857,False,3605.320573 +9a6f79a5-5447-4a34-b6a6-5d8f9d20672d,gemini-2.5-flash,gemini,run-pdp11-code,8946,13572,22518,848.854832,False,0.0,gemini-2.5-flash,run-pdp11-code,848.854832,False,0.0,False,848.854832 +c27b65a0-4c91-4f6f-b501-82382ebc4d8d,gpt-5-mini,openai,chess-best-move,16681,7413,24094,652.434609,False,0.0,gpt-5-mini,chess-best-move,652.434609,False,0.0,False,652.434609 +5fc11512-4b0e-4eb5-8313-398638a6adac,gemini-2.5-pro,gemini,merge-diff-arc-agi-task,8379,2876,11255,255.241637,True,1.0,gemini-2.5-pro,merge-diff-arc-agi-task,255.241637,True,0.6,True,255.241637 +f8029e1d-ab53-4c8a-ac08-ea484c216b11,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,dna-insert,8210,7801,16011,302.344501,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,dna-insert,302.344501,False,0.0,False,302.344501 +c879060f-a87f-417c-a6a9-5664e8ad0470,grok-code-fast-1,xai,bn-fit-modify,13860,7786,21646,1031.690114,False,0.0,grok-code-fast-1,bn-fit-modify,1031.690114,False,0.0,False,1031.690114 +c61ad51e-9a6c-4085-94fb-66925868beba,OpenAI/gpt-oss-20B,together_ai,hf-model-inference,6931,16686,23617,905.219522,False,0.0,OpenAI/gpt-oss-20B,hf-model-inference,905.219522,False,0.4,False,905.219522 +76ffc68f-298c-4a17-9af8-2ebf6764985a,openai/gpt-oss-120b,together_ai,fix-ocaml-gc,29280,10803,40083,3617.420311,False,0.0,openai/gpt-oss-120b,fix-ocaml-gc,3617.420311,False,0.0,False,3617.420311 +ce97982a-1375-43c8-bf2b-c1426de2a205,grok-4-0709,xai,build-pov-ray,16963,7472,24435,1882.814736,True,1.0,grok-4-0709,build-pov-ray,1882.814736,True,1.0,True,1882.814736 +9c0c3e00-8bfc-4b18-9d4d-7e7ff6ab1ee1,deepseek-ai/DeepSeek-V3.1,together_ai,run-pdp11-code,21437,10641,32078,1000.335696,False,0.0,deepseek-ai/DeepSeek-V3.1,run-pdp11-code,1000.335696,False,0.0,False,1000.335696 
+3c935d1f-0e21-4915-a0f0-c864c86cc4ff,gpt-5-nano,openai,sanitize-git-repo,5198,4821,10019,405.671443,False,0.0,gpt-5-nano,sanitize-git-repo,405.671443,False,0.0,False,405.671443 +47e67633-e960-482e-a45a-b5f5f78a8387,OpenAI/gpt-oss-20B,together_ai,winning-avg-corewars,807,1478,2285,231.737965,False,0.0,OpenAI/gpt-oss-20B,winning-avg-corewars,231.737965,False,0.0,False,231.737965 +9069b432-4864-445c-97a0-9e3bfd53b36d,claude-opus-4-1-20250805,anthropic,qemu-startup,7168,5409,12577,397.317461,False,0.0,claude-opus-4-1-20250805,qemu-startup,397.317461,False,0.4285714285714285,False,397.317461 +e55d2084-c51a-4e7f-9d8c-130f8da953dc,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,circuit-fibsqrt,30496,34014,64510,3600.050767,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,circuit-fibsqrt,3600.050767,False,0.0,False,3600.050767 +ee1c65b2-caaf-4e4d-81bd-bb2e7cba0ca4,moonshotai/Kimi-K2-Instruct-0905,together_ai,sanitize-git-repo,4299,990,5289,1005.461702,False,0.0,moonshotai/Kimi-K2-Instruct-0905,sanitize-git-repo,1005.461702,False,0.0,False,1005.461702 +a8c7dbe8-7902-4f99-a666-1e13c78fde02,deepseek-ai/DeepSeek-V3.1,together_ai,wasm-pipeline,8699,8973,17672,323.960896,False,0.0,deepseek-ai/DeepSeek-V3.1,wasm-pipeline,323.960896,False,0.4,False,323.960896 +5a788267-8374-4452-a3a3-795d9b0061e7,deepseek-ai/DeepSeek-V3.1,together_ai,model-extraction-relu-logits,23776,21791,45567,798.141034,False,0.0,deepseek-ai/DeepSeek-V3.1,model-extraction-relu-logits,798.141034,False,0.2,False,798.141034 +da84d717-2fc7-4902-99a5-70ebcdc7056a,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,path-tracing,4406,4018,8424,320.513078,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,path-tracing,320.513078,False,0.0,False,320.513078 +db1d9636-215f-4977-930e-937bbc1f6a65,gemini-2.5-flash,gemini,pytorch-model-cli,2525,2004,4529,107.20064,False,0.0,gemini-2.5-flash,pytorch-model-cli,107.20064,False,0.0,False,107.20064 
+7ddc7bbe-58aa-472c-a4ec-ee7e06259bbc,gpt-5,openai,model-extraction-relu-logits,3195,3073,6268,137.309111,True,1.0,gpt-5,model-extraction-relu-logits,137.309111,True,0.1666666666666666,True,137.309111 +48a3250a-06f8-40df-9618-990fccea3ef8,gpt-5,openai,vulnerable-secret,2890,2985,5875,920.045444,False,0.0,gpt-5,vulnerable-secret,920.045444,False,0.2857142857142857,False,920.045444 +ab13dc61-78ac-4385-959a-74ca8e55d71b,claude-opus-4-1-20250805,anthropic,prove-plus-comm,1802,1154,2956,49.434102,True,1.0,claude-opus-4-1-20250805,prove-plus-comm,49.434102,True,1.0,True,49.434102 +334a7b50-49b5-4f5e-a239-f27ec1039d41,grok-code-fast-1,xai,crack-7z-hash,18153,3772,21925,916.788392,False,0.0,grok-code-fast-1,crack-7z-hash,916.788392,False,0.6,False,916.788392 +80dddf7a-6565-427e-916e-944b3f47539b,gemini-2.5-pro,gemini,install-klee-minimal,20159,2572,22731,900.390169,False,0.0,gemini-2.5-pro,install-klee-minimal,900.390169,False,0.0,False,900.390169 +1207a56c-016c-47e9-ab6d-45cf538b7af8,gpt-5-mini,openai,feal-linear-cryptanalysis,24247,17217,41464,1800.967376,False,0.0,gpt-5-mini,feal-linear-cryptanalysis,1800.967376,False,0.0,False,1800.967376 +6497829f-8449-4139-94c7-0a2c47b7883a,gpt-5-mini,openai,port-compressor,17235,21920,39155,3618.376007,False,0.0,gpt-5-mini,port-compressor,3618.376007,False,0.0,False,3618.376007 +4494f62e-961f-4455-80f3-89d9c1c9c10c,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,merge-diff-arc-agi-task,11485,4838,16323,900.244142,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,merge-diff-arc-agi-task,900.244142,False,0.0,False,900.244142 +41dcdcd6-a2ae-43ae-9714-8ad88799b586,gpt-5,openai,constraints-scheduling,3550,1633,5183,265.556712,True,1.0,gpt-5,constraints-scheduling,265.556712,True,0.8571428571428571,True,265.556712 +9c3f8abf-d5d2-4983-9ca7-877008d5ec55,gpt-5-nano,openai,mteb-retrieve,7248,11440,18688,1818.220261,False,0.0,gpt-5-nano,mteb-retrieve,1818.220261,False,0.0,False,1818.220261 
+feaf761c-261a-4830-9346-a5382bcfe348,gpt-5-mini,openai,financial-document-processor,3824,4323,8147,200.88557,False,0.0,gpt-5-mini,financial-document-processor,200.88557,False,0.0,False,200.88557 +9fc225d5-3115-4f43-b789-cf2a7508f53e,openai/gpt-oss-120b,together_ai,install-klee-minimal,4578,2467,7045,900.162637,False,0.0,openai/gpt-oss-120b,install-klee-minimal,900.162637,False,0.0,False,900.162637 +d416f3de-255b-485a-a1c0-3bbbcb6a9ee1,claude-sonnet-4-20250514,anthropic,dna-insert,12122,7316,19438,365.448887,False,0.0,claude-sonnet-4-20250514,dna-insert,365.448887,False,0.0,False,365.448887 +efef8e61-e0b6-47d5-9fd6-e906cf9f8d5e,gemini-2.5-flash,gemini,dna-insert,8413,1474,9887,366.968483,False,0.0,gemini-2.5-flash,dna-insert,366.968483,False,0.0,False,366.968483 +4bef9563-e93d-4b88-bf3d-bfacb401ef98,gpt-5-mini,openai,cobol-modernization,7469,3918,11387,324.869764,True,1.0,gpt-5-mini,cobol-modernization,324.869764,True,1.0,True,324.869764 +95c37ddd-ff69-46a6-a666-18b591f41a7c,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,filter-js-from-html,4373,4292,8665,403.638001,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,filter-js-from-html,403.638001,False,0.0,False,403.638001 +97e28987-629e-4208-8547-62524dd7084d,deepseek-ai/DeepSeek-V3.1,together_ai,sanitize-git-repo,12669,3039,15708,509.294057,False,0.0,deepseek-ai/DeepSeek-V3.1,sanitize-git-repo,509.294057,False,0.0,False,509.294057 +22f4265a-71d9-4535-afe9-34615065d4ab,zai-org/GLM-4.5-Air-FP8,together_ai,vulnerable-secret,24194,10206,34400,906.501625,False,0.0,zai-org/GLM-4.5-Air-FP8,vulnerable-secret,906.501625,False,0.0,False,906.501625 +1ddf7e9c-7a29-4b40-8935-39f3c02f10cc,openai/gpt-oss-120b,together_ai,schemelike-metacircular-eval,31604,47142,78746,2400.033948,False,0.0,openai/gpt-oss-120b,schemelike-metacircular-eval,2400.033948,False,0.0,False,2400.033948 
+444230cf-b35b-4c74-ba14-dd6ebbd853c9,claude-opus-4-1-20250805,anthropic,code-from-image,17379,16856,34235,1202.099865,False,0.0,claude-opus-4-1-20250805,code-from-image,1202.099865,False,0.125,False,1202.099865 +a96d27af-d2b1-452c-9fcb-b0139e76c7ea,gemini-2.5-flash,gemini,mteb-retrieve,9544,3406,12950,229.928467,False,0.0,gemini-2.5-flash,mteb-retrieve,229.928467,False,0.0,False,229.928467 +7e21ae14-e04c-4f63-a7cf-836fbacf25d6,deepseek-ai/DeepSeek-V3.1,together_ai,crack-7z-hash,9016,3509,12525,435.919866,False,0.0,deepseek-ai/DeepSeek-V3.1,crack-7z-hash,435.919866,False,0.8,False,435.919866 +9af0b005-a364-4e67-822f-8c7e23911e9f,claude-sonnet-4-20250514,anthropic,filter-js-from-html,9112,7103,16215,755.653321,False,0.0,claude-sonnet-4-20250514,filter-js-from-html,755.653321,False,0.0,False,755.653321 +18603003-dfaa-4b0c-bf90-27e91925acc7,gpt-5-mini,openai,hf-model-inference,3827,1720,5547,339.060156,True,1.0,gpt-5-mini,hf-model-inference,339.060156,True,0.8,True,339.060156 +2bd62ac0-fae2-40c2-8a7a-1812094ce5c5,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,password-recovery,2513,2001,4514,136.873587,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,password-recovery,136.873587,False,0.0,False,136.873587 +6d86d0f1-1bd9-41f4-85e7-8bb7cc70fb53,gpt-5,openai,pytorch-model-recovery,8535,7784,16319,370.610594,True,1.0,gpt-5,pytorch-model-recovery,370.610594,True,0.4285714285714285,True,370.610594 +bbbc214a-913a-4840-a2ad-ca3a8746561b,openai/gpt-oss-120b,together_ai,tune-mjcf,9061,9078,18139,907.71481,False,0.0,openai/gpt-oss-120b,tune-mjcf,907.71481,False,0.2,False,907.71481 +e0b54c21-7a19-4106-87a2-4c9bdd9882ce,openai/gpt-oss-120b,together_ai,feal-linear-cryptanalysis,8378,5680,14058,210.976295,True,1.0,openai/gpt-oss-120b,feal-linear-cryptanalysis,210.976295,True,0.4,True,210.976295 
+6e98b0d7-c3a4-4e48-9b46-c304e7f92aab,gpt-5,openai,distribution-search,4911,3815,8726,450.929963,True,1.0,gpt-5,distribution-search,450.929963,True,1.0,True,450.929963 +49ec91e7-60fb-4f0d-b6e1-68567f5f90ab,claude-sonnet-4-20250514,anthropic,sparql-university,8987,4190,13177,595.466802,False,0.0,claude-sonnet-4-20250514,sparql-university,595.466802,False,0.0,False,595.466802 +dc75b0aa-b489-438f-b107-4bfe4a68973c,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,cancel-async-tasks,2361,2079,4440,900.626118,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,cancel-async-tasks,900.626118,True,0.6,True,900.626118 +0f9ff584-d3a6-47c9-b8c8-865b1666693d,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,pypi-server,5520,1717,7237,359.145954,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,pypi-server,359.145954,False,0.2,False,359.145954 +7f3496a1-13ee-415c-8157-2359add0aa30,gpt-5,openai,torch-tensor-parallelism,3619,5472,9091,366.392131,False,0.0,gpt-5,torch-tensor-parallelism,366.392131,False,0.0,False,366.392131 +28813d60-6bf7-48c0-b48b-2ff82aebd76f,gemini-2.5-pro,gemini,nginx-request-logging,3745,1273,5018,105.732398,True,1.0,gemini-2.5-pro,nginx-request-logging,105.732398,True,0.6,True,105.732398 +b7a1be39-8872-4fed-b9c7-bcdddc372a93,grok-4-0709,xai,extract-elf,2649,1224,3873,455.43338,False,0.0,grok-4-0709,extract-elf,455.43338,False,0.2,False,455.43338 +517c2497-6f85-4980-a42e-8c6f39328a4f,gemini-2.5-pro,gemini,merge-diff-arc-agi-task,7920,2299,10219,919.659348,True,1.0,gemini-2.5-pro,merge-diff-arc-agi-task,919.659348,True,0.6,True,919.659348 +d0a47b4a-6eff-422f-ad93-b6a7a215b0e7,gpt-5,openai,install-klee-minimal,1817,1889,3706,900.064479,False,0.0,gpt-5,install-klee-minimal,900.064479,False,0.0,False,900.064479 +621655c2-b7af-40db-a72e-cb970121a00a,gpt-5-nano,openai,path-tracing,3859,3172,7031,198.459098,False,0.0,gpt-5-nano,path-tracing,198.459098,False,0.2,False,198.459098 
+dc624d64-5e20-4aff-ad4e-d45030dfba95,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,break-filter-js-from-html,8849,11079,19928,1101.209751,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,break-filter-js-from-html,1101.209751,False,0.0,False,1101.209751 +2533a021-8594-429f-a203-99bcf8485608,zai-org/GLM-4.5-Air-FP8,together_ai,filter-js-from-html,17196,18568,35764,805.143316,False,0.0,zai-org/GLM-4.5-Air-FP8,filter-js-from-html,805.143316,False,0.0,False,805.143316 +3984abde-a929-4da4-8b97-2d5d94c2b6c6,moonshotai/Kimi-K2-Instruct-0905,together_ai,chess-best-move,9284,8149,17433,471.861006,False,0.0,moonshotai/Kimi-K2-Instruct-0905,chess-best-move,471.861006,False,0.0,False,471.861006 +0294ef5b-3b04-4640-a9ed-dbc7bd635c20,OpenAI/gpt-oss-20B,together_ai,make-doom-for-mips,1055,1900,2955,1001.54888,False,0.0,OpenAI/gpt-oss-20B,make-doom-for-mips,1001.54888,False,0.0,False,1001.54888 +be6cf86b-4f26-4f55-b971-cf2c087f8727,gpt-5-mini,openai,schemelike-metacircular-eval,20910,18871,39781,2428.968544,False,0.0,gpt-5-mini,schemelike-metacircular-eval,2428.968544,False,0.0,False,2428.968544 +bed85c80-9363-4acf-849f-5369fe2221d4,gemini-2.5-flash,gemini,pytorch-model-recovery,10309,14489,24798,903.391383,False,0.0,gemini-2.5-flash,pytorch-model-recovery,903.391383,False,0.2,False,903.391383 +9d4f126a-1f1d-4a75-8c9d-a0ac12c9b84b,zai-org/GLM-4.5-Air-FP8,together_ai,write-compressor,9657,8952,18609,1033.294118,False,0.0,zai-org/GLM-4.5-Air-FP8,write-compressor,1033.294118,False,0.0,False,1033.294118 +2edfe09c-c286-49d1-962e-efa450cccca0,claude-opus-4-1-20250805,anthropic,model-extraction-relu-logits,6408,4750,11158,182.227921,False,0.0,claude-opus-4-1-20250805,model-extraction-relu-logits,182.227921,False,0.0,False,182.227921 +2167e733-500c-45aa-9997-cad189d45c77,gpt-5-mini,openai,openssl-selfsigned-cert,2534,2291,4825,149.276407,True,1.0,gpt-5-mini,openssl-selfsigned-cert,149.276407,True,0.8,True,149.276407 
+6d607abd-05fd-4082-b28a-1135da5b0691,gpt-5-nano,openai,feal-differential-cryptanalysis,5233,5865,11098,657.022342,False,0.0,gpt-5-nano,feal-differential-cryptanalysis,657.022342,False,0.0,False,657.022342 +5ef428bd-2533-4283-95f8-2cece4c55e0b,grok-4-0709,xai,sparql-university,4943,1257,6200,386.212565,True,1.0,grok-4-0709,sparql-university,386.212565,True,0.4,True,386.212565 +3d0a4824-e96e-4fa6-a694-344abeb3c8ad,deepseek-ai/DeepSeek-V3.1,together_ai,openssl-selfsigned-cert,4495,3563,8058,219.22409,True,1.0,deepseek-ai/DeepSeek-V3.1,openssl-selfsigned-cert,219.22409,True,1.0,True,219.22409 +96a8d27a-2b18-4290-b066-e003696f4a34,gpt-5,openai,prove-plus-comm,2401,1474,3875,219.044767,True,1.0,gpt-5,prove-plus-comm,219.044767,True,0.8571428571428571,True,219.044767 +e0cd8363-037c-4c37-9209-47a1ff78067d,claude-sonnet-4-20250514,anthropic,make-doom-for-mips,16801,5684,22485,908.84883,False,0.0,claude-sonnet-4-20250514,make-doom-for-mips,908.84883,False,0.0,False,908.84883 +8ce8262e-647f-4f46-9120-2f75ca722077,claude-opus-4-1-20250805,anthropic,extract-elf,5840,3659,9499,132.109921,True,1.0,claude-opus-4-1-20250805,extract-elf,132.109921,True,0.8888888888888888,True,132.109921 +5cd2324a-63e5-4417-9edc-755ac39359d3,claude-opus-4-1-20250805,anthropic,adaptive-rejection-sampler,4901,7274,12175,947.652979,False,0.0,claude-opus-4-1-20250805,adaptive-rejection-sampler,947.652979,False,0.125,False,947.652979 +aaf3fe24-154a-47da-afd1-23768c05d30e,moonshotai/Kimi-K2-Instruct-0905,together_ai,financial-document-processor,12673,7081,19754,650.56219,False,0.0,moonshotai/Kimi-K2-Instruct-0905,financial-document-processor,650.56219,False,0.0,False,650.56219 +86934fd0-337b-47b4-9004-ed4041dcb44a,gemini-2.5-flash,gemini,make-doom-for-mips,26194,7826,34020,900.553414,False,0.0,gemini-2.5-flash,make-doom-for-mips,900.553414,False,0.0,False,900.553414 
+4d0065a9-4aa6-411b-8936-449279085253,grok-code-fast-1,xai,dna-insert,962,436,1398,368.980774,False,0.0,grok-code-fast-1,dna-insert,368.980774,False,0.0,False,368.980774 +81e43f3a-062a-4da3-9460-0848453b8b02,grok-4-0709,xai,polyglot-c-py,1209,631,1840,488.151746,True,1.0,grok-4-0709,polyglot-c-py,488.151746,True,0.6,True,488.151746 +fd49775d-337b-4213-86d0-f821857e7099,moonshotai/Kimi-K2-Instruct-0905,together_ai,extract-elf,9328,6566,15894,555.879275,False,0.0,moonshotai/Kimi-K2-Instruct-0905,extract-elf,555.879275,False,0.6,False,555.879275 +f569ab9b-964a-4a0d-a1e8-dd50f8327ff4,gemini-2.5-flash,gemini,reshard-c4-data,6789,7517,14306,338.965268,False,0.0,gemini-2.5-flash,reshard-c4-data,338.965268,False,0.0,False,338.965268 +c4d34cee-3c07-42c1-a333-aa5b92c0b7a9,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sanitize-git-repo,7550,3446,10996,566.58534,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sanitize-git-repo,566.58534,False,0.0,False,566.58534 +8b907b58-54b4-4dcc-a0ee-d64b91e12c1e,claude-opus-4-1-20250805,anthropic,db-wal-recovery,11231,5746,16977,587.430964,False,0.0,claude-opus-4-1-20250805,db-wal-recovery,587.430964,False,0.0,False,587.430964 +0afcfa0b-7968-4c38-b0ec-90c0a0c96859,claude-opus-4-1-20250805,anthropic,constraints-scheduling,4972,2923,7895,86.497593,True,1.0,claude-opus-4-1-20250805,constraints-scheduling,86.497593,True,0.8888888888888888,True,86.497593 +a9753015-2283-4eca-b470-cf84e34091b5,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sparql-university,2549,1194,3743,57.438985,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sparql-university,57.438985,False,0.0,False,57.438985 +f7854252-a966-49af-bc48-fbaf7ca73a72,deepseek-ai/DeepSeek-V3.1,together_ai,make-mips-interpreter,15923,20627,36550,1800.93035,False,0.0,deepseek-ai/DeepSeek-V3.1,make-mips-interpreter,1800.93035,False,0.0,False,1800.93035 
+949cd74a-c571-4201-a276-5a1accf20e0e,gemini-2.5-pro,gemini,model-extraction-relu-logits,4077,3142,7219,379.072137,False,0.0,gemini-2.5-pro,model-extraction-relu-logits,379.072137,False,0.0,False,379.072137 +f8300148-1fe7-4dde-a160-426aea23a040,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,break-filter-js-from-html,8748,11004,19752,1220.476872,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,break-filter-js-from-html,1220.476872,False,0.0,False,1220.476872 +70dbedd7-20e1-40bf-bda0-aaa50480231b,gpt-5-nano,openai,nginx-request-logging,4699,3911,8610,1024.089891,False,0.0,gpt-5-nano,nginx-request-logging,1024.089891,False,0.0,False,1024.089891 +6b194578-73b4-4f05-b022-f752e1852cac,claude-sonnet-4-20250514,anthropic,log-summary-date-ranges,8990,3970,12960,249.15373,True,1.0,claude-sonnet-4-20250514,log-summary-date-ranges,249.15373,True,1.0,True,249.15373 +47a204fe-4d6d-4bd1-972a-af0702c21f5d,gpt-5-mini,openai,torch-tensor-parallelism,2815,2318,5133,116.723887,False,0.0,gpt-5-mini,torch-tensor-parallelism,116.723887,False,0.0,False,116.723887 +c78ac0ac-4e2f-459b-9de1-32abcd268740,OpenAI/gpt-oss-20B,together_ai,sparql-university,522,1141,1663,335.482886,False,0.0,OpenAI/gpt-oss-20B,sparql-university,335.482886,False,0.0,False,335.482886 +16c5def7-83a1-42b7-9ffb-d7065da572e0,openai/gpt-oss-120b,together_ai,crack-7z-hash,10145,3628,13773,335.898885,False,0.0,openai/gpt-oss-120b,crack-7z-hash,335.898885,False,0.0,False,335.898885 +b640f0d1-80dd-433e-a775-a32107ab13d4,gpt-5-nano,openai,dna-insert,6850,5703,12553,367.3831,False,0.0,gpt-5-nano,dna-insert,367.3831,False,0.0,False,367.3831 +b58be45c-0809-467d-8110-458d5c47422f,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,wasm-pipeline,16269,5443,21712,541.587887,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,wasm-pipeline,541.587887,False,0.0,False,541.587887 
+10d932ef-09b3-448a-9137-c0d41d9768f0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,largest-eigenval,2202,1611,3813,907.779643,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,largest-eigenval,907.779643,False,0.2,False,907.779643 +c068bfa3-5ca2-409c-999a-0d811c6ac76a,gemini-2.5-pro,gemini,circuit-fibsqrt,12006,13747,25753,1048.719121,False,0.0,gemini-2.5-pro,circuit-fibsqrt,1048.719121,False,0.0,False,1048.719121 +0e3d4498-59bb-493e-8c80-c890826a51b7,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,crack-7z-hash,20740,6391,27131,910.169873,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,crack-7z-hash,910.169873,False,0.0,False,910.169873 +e494e657-f427-4915-b6c0-5afa96fa3d07,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,openssl-selfsigned-cert,2500,1697,4197,78.41501,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,openssl-selfsigned-cert,78.41501,False,0.0,False,78.41501 +5a8c6cab-5d2b-4a51-9459-61dc03cd3c1f,grok-code-fast-1,xai,password-recovery,3756,3810,7566,393.118825,False,0.0,grok-code-fast-1,password-recovery,393.118825,False,0.0,False,393.118825 +40f175e0-41c0-4ece-bd2d-c362337fe1a1,grok-code-fast-1,xai,install-klee-minimal,10829,2718,13547,900.032245,False,0.0,grok-code-fast-1,install-klee-minimal,900.032245,False,0.0,False,900.032245 +d8e453c2-2891-4f35-a246-a52b6e246ca1,claude-sonnet-4-20250514,anthropic,pytorch-model-recovery,5758,4369,10127,281.056262,True,1.0,claude-sonnet-4-20250514,pytorch-model-recovery,281.056262,True,1.0,True,281.056262 +2303fae9-8cbf-4cb4-8140-a50cbbb4e319,gemini-2.5-pro,gemini,build-pov-ray,35999,11491,47490,3241.614184,True,1.0,gemini-2.5-pro,build-pov-ray,3241.614184,True,1.0,True,3241.614184 +bbd68584-8d73-4538-a6e8-0b466cb4dabf,OpenAI/gpt-oss-20B,together_ai,fix-ocaml-gc,2851,1258,4109,189.782575,False,0.0,OpenAI/gpt-oss-20B,fix-ocaml-gc,189.782575,False,0.0,False,189.782575 
+88ff674f-519b-4fa9-9836-9c8cddedf725,gpt-5-mini,openai,feal-linear-cryptanalysis,7522,5464,12986,670.06386,False,0.0,gpt-5-mini,feal-linear-cryptanalysis,670.06386,False,0.0,False,670.06386 +a4f7e7ac-78e2-4161-ba82-d948d89f8808,deepseek-ai/DeepSeek-V3.1,together_ai,db-wal-recovery,1920,1967,3887,924.011394,False,0.0,deepseek-ai/DeepSeek-V3.1,db-wal-recovery,924.011394,False,0.0,False,924.011394 +325d2035-375b-4b45-a702-330cd8554324,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,port-compressor,34797,13409,48206,3613.524651,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,port-compressor,3613.524651,False,0.0,False,3613.524651 +5a265616-32cd-42ad-a8d4-896899dd9b88,claude-opus-4-1-20250805,anthropic,pytorch-model-recovery,7334,4580,11914,902.330004,True,1.0,claude-opus-4-1-20250805,pytorch-model-recovery,902.330004,True,1.0,True,902.330004 +70aa9ff5-6468-4b8f-b109-ba5ffcc1259b,grok-4-0709,xai,circuit-fibsqrt,4466,3145,7611,2062.591725,False,0.0,grok-4-0709,circuit-fibsqrt,2062.591725,False,0.0,False,2062.591725 +93fc19f0-eb37-45e7-8f75-9dd3ee395ad5,moonshotai/Kimi-K2-Instruct-0905,together_ai,sparql-university,6600,3512,10112,244.127457,False,0.0,moonshotai/Kimi-K2-Instruct-0905,sparql-university,244.127457,False,0.0,False,244.127457 +007a88ca-44bb-421a-bb4a-039c5eb8cd68,gemini-2.5-pro,gemini,bn-fit-modify,32847,13846,46693,3511.16303,False,0.0,gemini-2.5-pro,bn-fit-modify,3511.16303,False,0.0,False,3511.16303 +c183ee83-708e-428f-8b5e-b337a716dd1c,moonshotai/Kimi-K2-Instruct-0905,together_ai,tune-mjcf,8321,9136,17457,900.378612,False,0.0,moonshotai/Kimi-K2-Instruct-0905,tune-mjcf,900.378612,False,0.4,False,900.378612 +8e6a5074-9071-4c97-aed6-4f2aeb388de6,gemini-2.5-pro,gemini,polyglot-rust-c,4472,5106,9578,909.72141,False,0.0,gemini-2.5-pro,polyglot-rust-c,909.72141,False,0.0,False,909.72141 
+74885a5e-6fd5-4003-974b-776be6047c09,gpt-5-mini,openai,git-leak-recovery,1896,1882,3778,238.546245,False,0.0,gpt-5-mini,git-leak-recovery,238.546245,False,0.0,False,238.546245 +f5d30300-ef64-4314-a244-eca820e84e93,gemini-2.5-pro,gemini,nginx-request-logging,4727,1298,6025,177.69263,True,1.0,gemini-2.5-pro,nginx-request-logging,177.69263,True,0.6,True,177.69263 +b66f4645-bfb8-45db-969a-bf08859155f2,gpt-5-mini,openai,polyglot-c-py,4562,2954,7516,900.386915,False,0.0,gpt-5-mini,polyglot-c-py,900.386915,False,0.0,False,900.386915 +50b51e0d-10d2-42c8-9acf-97eada281776,openai/gpt-oss-120b,together_ai,mteb-retrieve,1712,621,2333,46.369117,False,0.0,openai/gpt-oss-120b,mteb-retrieve,46.369117,False,0.0,False,46.369117 +05199fa2-cc1e-4201-bae0-6bf937da1b3c,gemini-2.5-pro,gemini,reshard-c4-data,7190,3217,10407,514.007344,False,0.0,gemini-2.5-pro,reshard-c4-data,514.007344,False,0.0,False,514.007344 +3b1899c8-d1de-4339-8075-b83647c72bca,gpt-5-nano,openai,fix-git,4098,3097,7195,944.405087,False,0.0,gpt-5-nano,fix-git,944.405087,False,0.0,False,944.405087 +87e81dc7-3412-4fa2-aeaf-24262ad9255a,gpt-5,openai,password-recovery,8816,7292,16108,900.001847,False,0.0,gpt-5,password-recovery,900.001847,False,0.0,False,900.001847 +3be62b55-b5fc-4363-85db-44fb31833124,gemini-2.5-pro,gemini,mteb-retrieve,2245,1364,3609,379.667864,False,0.0,gemini-2.5-pro,mteb-retrieve,379.667864,False,0.0,False,379.667864 +3de7e646-8d0e-4e5d-b101-8fe9ed95c696,gpt-5-nano,openai,fix-git,3736,1391,5127,161.950019,False,0.0,gpt-5-nano,fix-git,161.950019,False,0.0,False,161.950019 +650e0956-5a92-4842-a328-db3dd871c31c,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,extract-elf,3400,2835,6235,175.25702,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,extract-elf,175.25702,False,0.0,False,175.25702 
+0fc04776-bb22-4e43-8c1c-8d0394ef5b4e,claude-sonnet-4-20250514,anthropic,torch-tensor-parallelism,3130,2004,5134,94.305263,False,0.0,claude-sonnet-4-20250514,torch-tensor-parallelism,94.305263,False,0.0,False,94.305263 +18dcde71-014b-4085-95fe-54390c344185,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,mteb-leaderboard,9581,2160,11741,1869.325197,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,mteb-leaderboard,1869.325197,False,0.0,False,1869.325197 +08c4ae76-62af-48ac-bdaa-a03318c56d41,claude-sonnet-4-20250514,anthropic,gpt2-codegolf,12313,13793,26106,901.220506,False,0.0,claude-sonnet-4-20250514,gpt2-codegolf,901.220506,False,0.0,False,901.220506 +ffb59b60-5052-4275-b34a-1fa69d9475fe,gpt-5,openai,vulnerable-secret,9169,5369,14538,901.358977,False,0.0,gpt-5,vulnerable-secret,901.358977,False,0.2857142857142857,False,901.358977 +26610c59-e092-4e30-8263-2d73408b077c,grok-code-fast-1,xai,polyglot-c-py,0,0,0,900.001487,False,0.0,grok-code-fast-1,polyglot-c-py,900.001487,False,0.0,False,900.001487 +b36aa925-62d4-4629-a715-223f7c7283f0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,chess-best-move,4010,2112,6122,905.009129,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,chess-best-move,905.009129,False,0.0,False,905.009129 +5548f677-e049-4164-9c74-ae2309d1b26b,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,adaptive-rejection-sampler,11723,4617,16340,905.534168,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,adaptive-rejection-sampler,905.534168,False,0.0,False,905.534168 +eaef5204-48b0-4172-9113-61aded1ad775,gpt-5-mini,openai,polyglot-rust-c,5167,7105,12272,919.401645,False,0.0,gpt-5-mini,polyglot-rust-c,919.401645,False,0.0,False,919.401645 +7531ff46-7cd9-48f4-83ad-f49a225e5d54,gpt-5-nano,openai,build-initramfs-qemu,9800,9475,19275,914.555972,False,0.0,gpt-5-nano,build-initramfs-qemu,914.555972,False,0.0,False,914.555972 
+d77d25a3-d14a-49cf-9b61-1bd93315d651,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,make-mips-interpreter,13940,12185,26125,1800.767036,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,make-mips-interpreter,1800.767036,False,0.0,False,1800.767036 +4ffafc8b-7fd7-45fb-ad20-22d8216006bd,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,train-fasttext,11200,5124,16324,1005.663952,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,train-fasttext,1005.663952,False,0.0,False,1005.663952 +acac0e33-8058-4f0e-8df6-8d3a509615cb,grok-code-fast-1,xai,pytorch-model-cli,9664,3757,13421,751.040226,False,0.0,grok-code-fast-1,pytorch-model-cli,751.040226,False,0.0,False,751.040226 +d83d993e-0600-4854-b8d2-213ce62d19ff,claude-sonnet-4-20250514,anthropic,code-from-image,6426,6227,12653,502.339511,False,0.0,claude-sonnet-4-20250514,code-from-image,502.339511,False,0.2,False,502.339511 +a0584ffb-489b-4a7d-8173-fd06e52e58a3,gemini-2.5-flash,gemini,model-extraction-relu-logits,4278,4008,8286,233.88401,False,0.0,gemini-2.5-flash,model-extraction-relu-logits,233.88401,False,0.2,False,233.88401 +aa577c68-82a4-4e92-beaf-6cd39e73dd1b,gpt-5,openai,crack-7z-hash,7882,4822,12704,693.078611,False,0.0,gpt-5,crack-7z-hash,693.078611,False,0.4285714285714285,False,693.078611 +55beffa3-bc8c-4001-8726-fadc1fb3b5dc,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,hf-model-inference,3697,1347,5044,109.809239,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,hf-model-inference,109.809239,True,0.8,True,109.809239 +aa59ad01-e2ee-4f80-aa45-0d725fa8a7e5,openai/gpt-oss-120b,together_ai,build-pov-ray,12457,6619,19076,1982.660405,False,0.0,openai/gpt-oss-120b,build-pov-ray,1982.660405,False,0.0,False,1982.660405 +471a897c-ef65-47bc-a26d-f60139da84b6,gpt-5,openai,break-filter-js-from-html,2742,1295,4037,437.814998,False,0.0,gpt-5,break-filter-js-from-html,437.814998,False,0.4285714285714285,False,437.814998 
+6edbeb23-a268-4d4d-8b69-3470d7ee7fd8,openai/gpt-oss-120b,together_ai,openssl-selfsigned-cert,3060,2338,5398,138.642155,True,1.0,openai/gpt-oss-120b,openssl-selfsigned-cert,138.642155,True,0.8,True,138.642155 +eb6bc6bc-0941-4e03-8ae8-6fc3a3941013,moonshotai/Kimi-K2-Instruct-0905,together_ai,feal-differential-cryptanalysis,17185,18468,35653,1800.032216,False,0.0,moonshotai/Kimi-K2-Instruct-0905,feal-differential-cryptanalysis,1800.032216,False,0.0,False,1800.032216 +39bb1cc9-64bf-48c5-b4ba-488d0b480755,moonshotai/Kimi-K2-Instruct-0905,together_ai,adaptive-rejection-sampler,12620,11657,24277,900.040032,False,0.0,moonshotai/Kimi-K2-Instruct-0905,adaptive-rejection-sampler,900.040032,False,0.0,False,900.040032 +09a56d5c-89e8-4256-b590-c3fee3bd55c8,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-cython-ext,18295,6848,25143,745.966361,False,0.0,moonshotai/Kimi-K2-Instruct-0905,build-cython-ext,745.966361,False,0.0,False,745.966361 +56725b80-24a6-40b8-93a0-3a1a48cc0bb5,gemini-2.5-flash,gemini,reverse-engineering,22508,18345,40853,1805.078216,False,0.0,gemini-2.5-flash,reverse-engineering,1805.078216,False,0.0,False,1805.078216 +fa04e5ef-1582-4f5a-a06f-13209cd53795,gpt-5,openai,code-from-image,9244,5831,15075,428.287744,True,1.0,gpt-5,code-from-image,428.287744,True,0.4,True,428.287744 +b8db9335-78b1-4bed-b311-101d54fe3041,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,pypi-server,9254,5175,14429,900.033032,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,pypi-server,900.033032,False,0.0,False,900.033032 +1d797159-d8ee-4ff3-907b-82bdc431a0d4,gpt-5,openai,log-summary-date-ranges,5838,2007,7845,273.448434,False,0.0,gpt-5,log-summary-date-ranges,273.448434,False,0.0,False,273.448434 +5012fde6-6065-4285-902b-080179fcbfed,openai/gpt-oss-120b,together_ai,nginx-request-logging,3817,1895,5712,150.540703,False,0.0,openai/gpt-oss-120b,nginx-request-logging,150.540703,False,0.4,False,150.540703 
+2f822d19-327a-4092-a057-2cb2d707c402,claude-opus-4-1-20250805,anthropic,cobol-modernization,5148,3982,9130,133.045817,True,1.0,claude-opus-4-1-20250805,cobol-modernization,133.045817,True,0.875,True,133.045817 +7c66249f-7d19-4818-99bc-6b18ffbbf48b,gpt-5,openai,pytorch-model-cli,2835,3863,6698,380.339611,False,0.0,gpt-5,pytorch-model-cli,380.339611,False,0.0,False,380.339611 +4fa68048-81b8-4d1c-bdf6-1f9498e5435b,claude-sonnet-4-20250514,anthropic,dna-insert,12476,8773,21249,360.095015,False,0.0,claude-sonnet-4-20250514,dna-insert,360.095015,False,0.0,False,360.095015 +55989932-54ad-4b20-bc1a-cb12e52bbac5,gemini-2.5-flash,gemini,configure-git-webserver,7025,1334,8359,215.560349,False,0.0,gemini-2.5-flash,configure-git-webserver,215.560349,False,0.0,False,215.560349 +1faac076-907e-4c45-9e86-fd361c6067bb,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,dna-assembly,9174,6450,15624,730.336173,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,dna-assembly,730.336173,False,0.0,False,730.336173 +7a93d903-572d-4a46-a2a5-2f0d113bc701,gpt-5-mini,openai,wasm-pipeline,9481,9257,18738,911.05486,False,0.0,gpt-5-mini,wasm-pipeline,911.05486,False,0.6,False,911.05486 +6a1b95d7-3235-4bcf-bf84-e3a8d67beb3f,claude-opus-4-1-20250805,anthropic,pytorch-model-recovery,9022,6380,15402,902.161826,True,1.0,claude-opus-4-1-20250805,pytorch-model-recovery,902.161826,True,1.0,True,902.161826 +b7690543-5521-48f5-8444-6a71335383cd,openai/gpt-oss-120b,together_ai,distribution-search,2049,2234,4283,89.602971,False,0.0,openai/gpt-oss-120b,distribution-search,89.602971,False,0.0,False,89.602971 +1a7e41ab-4ed6-4c9f-b48c-cc31233ad18e,deepseek-ai/DeepSeek-V3.1,together_ai,pytorch-model-cli,4030,5104,9134,1198.713508,False,0.0,deepseek-ai/DeepSeek-V3.1,pytorch-model-cli,1198.713508,False,0.0,False,1198.713508 
+70c077a3-acb3-4766-b887-a3ee5e3a0fa7,grok-4-0709,xai,model-extraction-relu-logits,852,296,1148,1164.229483,False,0.0,grok-4-0709,model-extraction-relu-logits,1164.229483,False,0.0,False,1164.229483 +2adc6d64-018c-4698-a43f-d221ba4ba398,grok-code-fast-1,xai,make-doom-for-mips,20606,4028,24634,900.568042,False,0.0,grok-code-fast-1,make-doom-for-mips,900.568042,False,0.0,False,900.568042 +d952d7a4-2aa4-4256-b940-ff8bc21d7a87,zai-org/GLM-4.5-Air-FP8,together_ai,fix-ocaml-gc,45132,40046,85178,3341.003226,False,0.0,zai-org/GLM-4.5-Air-FP8,fix-ocaml-gc,3341.003226,False,0.0,False,3341.003226 +0e064c95-5952-48c4-a446-b36343aef6d4,OpenAI/gpt-oss-20B,together_ai,build-pmars,344,2586,2930,93.49419,False,0.0,OpenAI/gpt-oss-20B,build-pmars,93.49419,False,0.0,False,93.49419 +a16a7f97-95db-440a-a0fa-8c634070f020,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,pytorch-model-recovery,9047,6393,15440,903.378763,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,pytorch-model-recovery,903.378763,True,0.8,True,903.378763 +23c6deb2-a46c-4d51-bf96-d226c14c5a80,moonshotai/Kimi-K2-Instruct-0905,together_ai,winning-avg-corewars,15660,15868,31528,2585.892994,False,0.0,moonshotai/Kimi-K2-Instruct-0905,winning-avg-corewars,2585.892994,False,0.0,False,2585.892994 +eedbf001-f093-4294-9075-39bd749df56e,gemini-2.5-flash,gemini,pytorch-model-cli,2756,1715,4471,159.941768,False,0.0,gemini-2.5-flash,pytorch-model-cli,159.941768,False,0.0,False,159.941768 +9a906fc2-4488-481e-963a-ffa0e26868ed,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,winning-avg-corewars,6810,4793,11603,410.815988,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,winning-avg-corewars,410.815988,False,0.0,False,410.815988 +64e07463-a844-42bf-a4b9-1fa96080a741,openai/gpt-oss-120b,together_ai,install-klee-minimal,2329,2556,4885,900.002167,False,0.0,openai/gpt-oss-120b,install-klee-minimal,900.002167,False,0.0,False,900.002167 
+6aabb34e-4f54-4658-a7d1-a4a438907b84,zai-org/GLM-4.5-Air-FP8,together_ai,port-compressor,40421,26336,66757,3607.651755,False,0.0,zai-org/GLM-4.5-Air-FP8,port-compressor,3607.651755,False,0.0,False,3607.651755 +4ce324e8-aa9f-4215-a07c-8dc7bd4e0b75,grok-4-0709,xai,install-klee-minimal,10109,2196,12305,900.096919,False,0.0,grok-4-0709,install-klee-minimal,900.096919,False,0.0,False,900.096919 +e58c4f52-1525-4447-be83-e8d6da9965f2,openai/gpt-oss-120b,together_ai,path-tracing-reverse,22258,14923,37181,1816.060844,False,0.0,openai/gpt-oss-120b,path-tracing-reverse,1816.060844,False,0.0,False,1816.060844 +a76c1ffd-65f5-4a2a-827d-42e0cc3625d9,gemini-2.5-pro,gemini,financial-document-processor,12161,5654,17815,557.748855,False,0.0,gemini-2.5-pro,financial-document-processor,557.748855,False,0.0,False,557.748855 +d83f9dd9-f8c1-439b-84b7-01b10a3d864d,moonshotai/Kimi-K2-Instruct-0905,together_ai,port-compressor,64203,44519,108722,3600.001018,False,0.0,moonshotai/Kimi-K2-Instruct-0905,port-compressor,3600.001018,False,0.0,False,3600.001018 +13b2b7d7-4c63-47a0-b38f-8f95e3b370ab,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,model-extraction-relu-logits,11862,12121,23983,827.348843,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,model-extraction-relu-logits,827.348843,False,0.0,False,827.348843 +4d81f75d-8f9f-4466-92d8-310acfb90546,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,tune-mjcf,14991,9019,24010,926.874961,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,tune-mjcf,926.874961,False,0.0,False,926.874961 +0dfb13e5-503a-4d44-a304-9c8914aa3460,claude-opus-4-1-20250805,anthropic,dna-assembly,24171,15922,40093,724.926875,False,0.0,claude-opus-4-1-20250805,dna-assembly,724.926875,False,0.0,False,724.926875 +69cd9f98-6da5-4c76-ad99-d47dabe2afcf,gpt-5-nano,openai,fix-code-vulnerability,7594,5248,12842,901.082412,False,0.0,gpt-5-nano,fix-code-vulnerability,901.082412,False,0.2,False,901.082412 
+b3ca475f-a346-4ba2-86d3-4560fffc7555,openai/gpt-oss-120b,together_ai,distribution-search,1936,2091,4027,83.750681,False,0.0,openai/gpt-oss-120b,distribution-search,83.750681,False,0.0,False,83.750681 +149e1f1d-29c5-4b3b-b165-6f22abc80bc5,gpt-5,openai,install-klee-minimal,1637,1735,3372,900.153186,False,0.0,gpt-5,install-klee-minimal,900.153186,False,0.0,False,900.153186 +665c7647-871f-4cdd-bcca-aeb4f9814ca5,gpt-5,openai,wasm-pipeline,8378,8188,16566,334.868496,True,1.0,gpt-5,wasm-pipeline,334.868496,True,1.0,True,334.868496 +6996ed8b-bfcb-4daa-af5a-cbeea8248184,openai/gpt-oss-120b,together_ai,install-klee-minimal,5941,3599,9540,906.714287,False,0.0,openai/gpt-oss-120b,install-klee-minimal,906.714287,False,0.0,False,906.714287 +855d8bb1-5772-445b-925e-19be7213974e,claude-sonnet-4-20250514,anthropic,schemelike-metacircular-eval,40807,32830,73637,2402.966717,False,0.0,claude-sonnet-4-20250514,schemelike-metacircular-eval,2402.966717,False,0.0,False,2402.966717 +aaf2e8ee-6a7a-4aca-966d-71d622dba3de,gpt-5,openai,build-pmars,9722,4252,13974,941.314624,False,0.0,gpt-5,build-pmars,941.314624,False,0.8,False,941.314624 +060c3b7f-3ca7-4d76-9679-50f464e8ee2a,OpenAI/gpt-oss-20B,together_ai,bn-fit-modify,176,210,386,254.911604,False,0.0,OpenAI/gpt-oss-20B,bn-fit-modify,254.911604,False,0.0,False,254.911604 +6ebac9dd-0263-486c-8321-3f14341cf178,grok-code-fast-1,xai,code-from-image,7796,3766,11562,254.830644,False,0.0,grok-code-fast-1,code-from-image,254.830644,False,0.0,False,254.830644 +747858f2-7163-4aa8-ab35-9107d5fac434,grok-4-0709,xai,break-filter-js-from-html,2138,1924,4062,1218.204018,False,0.0,grok-4-0709,break-filter-js-from-html,1218.204018,False,0.0,False,1218.204018 +53e4ab75-260d-4300-afc6-93a74d677755,gemini-2.5-flash,gemini,dna-insert,16252,11892,28144,396.535286,False,0.0,gemini-2.5-flash,dna-insert,396.535286,False,0.0,False,396.535286 
+d2fa32bd-4c64-4b4d-b159-2cf3daf2b5e4,claude-sonnet-4-20250514,anthropic,cancel-async-tasks,2290,1807,4097,130.056178,True,1.0,claude-sonnet-4-20250514,cancel-async-tasks,130.056178,True,0.8,True,130.056178 +ff2d32cc-c8bc-45b4-ad79-92dfc7d1eba4,claude-opus-4-1-20250805,anthropic,run-pdp11-code,7391,5786,13177,599.3209,False,0.0,claude-opus-4-1-20250805,run-pdp11-code,599.3209,False,0.0,False,599.3209 +5f1d3157-e56b-481d-b703-97aca3d9908c,zai-org/GLM-4.5-Air-FP8,together_ai,fix-code-vulnerability,19280,10547,29827,907.45893,False,0.0,zai-org/GLM-4.5-Air-FP8,fix-code-vulnerability,907.45893,False,0.0,False,907.45893 +7fc0b3c6-c172-4ad1-82c0-8cc16c9f0746,claude-sonnet-4-20250514,anthropic,reverse-engineering,23686,17648,41334,1800.534735,False,0.0,claude-sonnet-4-20250514,reverse-engineering,1800.534735,False,0.0,False,1800.534735 +4f7db1d1-290c-4f6e-994a-ef7251203e4d,OpenAI/gpt-oss-20B,together_ai,feal-differential-cryptanalysis,445,2698,3143,276.480175,False,0.0,OpenAI/gpt-oss-20B,feal-differential-cryptanalysis,276.480175,False,0.0,False,276.480175 +f28927a8-6e4c-45c7-918b-24048dcc416a,deepseek-ai/DeepSeek-V3.1,together_ai,run-pdp11-code,16519,11979,28498,613.385989,False,0.0,deepseek-ai/DeepSeek-V3.1,run-pdp11-code,613.385989,False,0.0,False,613.385989 +ab4c763a-bf90-41f6-a18b-a1ae0858d47e,claude-sonnet-4-20250514,anthropic,make-mips-interpreter,29887,20363,50250,1802.642155,False,0.0,claude-sonnet-4-20250514,make-mips-interpreter,1802.642155,False,0.0,False,1802.642155 +0473ee54-0c86-4581-8902-a4fb39b92a88,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,feal-linear-cryptanalysis,6737,1505,8242,167.917433,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,feal-linear-cryptanalysis,167.917433,False,0.0,False,167.917433 +185c144f-e5f0-4413-8a71-980d641d7b3a,claude-opus-4-1-20250805,anthropic,db-wal-recovery,10036,9793,19829,364.409,False,0.0,claude-opus-4-1-20250805,db-wal-recovery,364.409,False,0.0,False,364.409 
+2880e3b8-6709-4818-b186-a00f298614f9,zai-org/GLM-4.5-Air-FP8,together_ai,bn-fit-modify,25184,14064,39248,902.013699,False,0.0,zai-org/GLM-4.5-Air-FP8,bn-fit-modify,902.013699,False,0.0,False,902.013699 +84aa667d-cc24-4886-9042-33872de44c29,deepseek-ai/DeepSeek-V3.1,together_ai,fix-git,4422,2462,6884,688.741257,True,1.0,deepseek-ai/DeepSeek-V3.1,fix-git,688.741257,True,0.8,True,688.741257 +d2458b21-a700-4b66-929c-faf70a4307fe,zai-org/GLM-4.5-Air-FP8,together_ai,wasm-pipeline,9587,10627,20214,366.979884,True,1.0,zai-org/GLM-4.5-Air-FP8,wasm-pipeline,366.979884,True,0.2,True,366.979884 +0d167cd0-381d-4a6d-a377-91cbfb270860,moonshotai/Kimi-K2-Instruct-0905,together_ai,train-fasttext,21097,9707,30804,3606.317587,False,0.0,moonshotai/Kimi-K2-Instruct-0905,train-fasttext,3606.317587,False,0.2,False,3606.317587 +6d82c420-6c4b-4a56-9bee-b5848d2d647e,gemini-2.5-pro,gemini,crack-7z-hash,15768,3534,19302,723.035224,True,1.0,gemini-2.5-pro,crack-7z-hash,723.035224,True,0.8,True,723.035224 +c3ab2e21-8e5b-44e2-8cec-711608eb807a,grok-4-0709,xai,feal-differential-cryptanalysis,2447,1505,3952,768.951183,True,1.0,grok-4-0709,feal-differential-cryptanalysis,768.951183,True,0.8,True,768.951183 +87b22db2-265d-45f7-b9f4-223e7a92e3cc,gpt-5,openai,port-compressor,18725,23315,42040,3606.570665,False,0.0,gpt-5,port-compressor,3606.570665,False,0.0,False,3606.570665 +e2d13ced-cf43-4c98-b974-110ab55f648e,deepseek-ai/DeepSeek-V3.1,together_ai,build-initramfs-qemu,8221,7743,15964,900.191695,False,0.0,deepseek-ai/DeepSeek-V3.1,build-initramfs-qemu,900.191695,False,0.0,False,900.191695 +db61f49d-ce3e-4f96-812c-9cb20d653a42,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,form-filling,18075,15423,33498,900.704781,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,form-filling,900.704781,False,0.8,False,900.704781 
+f293590c-d771-456a-8b24-c5cc2b11256a,openai/gpt-oss-120b,together_ai,mteb-retrieve,1781,789,2570,118.904306,False,0.0,openai/gpt-oss-120b,mteb-retrieve,118.904306,False,0.0,False,118.904306 +e32b93fd-1ba5-4760-b14b-b6ab067ae1fc,deepseek-ai/DeepSeek-V3.1,together_ai,configure-git-webserver,11704,3640,15344,383.410069,True,1.0,deepseek-ai/DeepSeek-V3.1,configure-git-webserver,383.410069,True,1.0,True,383.410069 +9c4ba46a-0d68-438f-9054-586208a13874,openai/gpt-oss-120b,together_ai,vulnerable-secret,1807,2506,4313,901.435665,False,0.0,openai/gpt-oss-120b,vulnerable-secret,901.435665,False,0.0,False,901.435665 +6acb8f19-5cdf-4c95-aecd-d333814cbe57,claude-opus-4-1-20250805,anthropic,run-pdp11-code,11206,6934,18140,1028.544067,False,0.0,claude-opus-4-1-20250805,run-pdp11-code,1028.544067,False,0.0,False,1028.544067 +61ef7093-b1fa-4d69-9ce6-92721df3d9da,OpenAI/gpt-oss-20B,together_ai,merge-diff-arc-agi-task,827,4361,5188,900.320443,False,0.0,OpenAI/gpt-oss-20B,merge-diff-arc-agi-task,900.320443,False,0.0,False,900.320443 +d0c97676-7b11-4025-9c0c-a294941592db,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,circuit-fibsqrt,15111,12868,27979,896.27068,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,circuit-fibsqrt,896.27068,False,0.0,False,896.27068 +142f0af5-5153-4871-bef3-eef70b2bba15,claude-opus-4-1-20250805,anthropic,build-pov-ray,17182,5030,22212,912.703749,True,1.0,claude-opus-4-1-20250805,build-pov-ray,912.703749,True,0.75,True,912.703749 +d67b5259-a4f2-495a-9a12-2e569af745e7,grok-code-fast-1,xai,train-fasttext,18217,6192,24409,2912.105278,False,0.0,grok-code-fast-1,train-fasttext,2912.105278,False,0.0,False,2912.105278 +758dff0f-500d-43a1-863a-744a5ac2b0f1,gemini-2.5-pro,gemini,pytorch-model-recovery,11214,3527,14741,275.47569,True,1.0,gemini-2.5-pro,pytorch-model-recovery,275.47569,True,1.0,True,275.47569 
+793f0a0a-4a22-46ce-933f-fa7649fb8af2,gpt-5-mini,openai,fix-code-vulnerability,10313,8050,18363,967.265609,False,0.0,gpt-5-mini,fix-code-vulnerability,967.265609,False,0.0,False,967.265609 +c4d4b96e-1911-4eb9-9763-44bf668f7a4f,moonshotai/Kimi-K2-Instruct-0905,together_ai,form-filling,7313,6644,13957,347.424744,True,1.0,moonshotai/Kimi-K2-Instruct-0905,form-filling,347.424744,True,0.8,True,347.424744 +1aa25fb9-a79a-477b-b626-47ffc541a59f,gpt-5,openai,build-pmars,12568,4303,16871,670.429353,True,1.0,gpt-5,build-pmars,670.429353,True,0.8,True,670.429353 +00dde788-6d08-4d72-952f-c1605da7bc3b,gemini-2.5-flash,gemini,vulnerable-secret,5541,3228,8769,907.901601,False,0.0,gemini-2.5-flash,vulnerable-secret,907.901601,False,0.0,False,907.901601 +716eaecb-5fcf-4eb8-b9db-12cab2900664,gpt-5,openai,filter-js-from-html,2839,3029,5868,246.87478,False,0.0,gpt-5,filter-js-from-html,246.87478,False,0.0,False,246.87478 +735d02ac-4a7f-41d6-89de-177acbdfe2dc,OpenAI/gpt-oss-20B,together_ai,build-initramfs-qemu,150,1428,1578,260.08733,False,0.0,OpenAI/gpt-oss-20B,build-initramfs-qemu,260.08733,False,0.0,False,260.08733 +bd046d7a-136a-4ff1-9dec-2959cd91a50a,openai/gpt-oss-120b,together_ai,dna-insert,9039,5763,14802,631.457432,False,0.0,openai/gpt-oss-120b,dna-insert,631.457432,False,0.0,False,631.457432 +1b7caa96-896f-488a-aff7-6be227b82c8e,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-initramfs-qemu,8342,5246,13588,501.99624,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-initramfs-qemu,501.99624,False,0.0,False,501.99624 +3d39b1b7-6f24-46d6-bf79-23703ede6295,OpenAI/gpt-oss-20B,together_ai,fix-code-vulnerability,0,0,0,1013.047545,False,0.0,OpenAI/gpt-oss-20B,fix-code-vulnerability,1013.047545,False,0.0,False,1013.047545 +1a57f12e-dacc-4078-ab30-3eb016ba3cec,gemini-2.5-pro,gemini,run-pdp11-code,9687,3075,12762,399.718383,False,0.0,gemini-2.5-pro,run-pdp11-code,399.718383,False,0.0,False,399.718383 
+c0311797-999a-4830-bc01-b1e54e30bc73,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,port-compressor,21370,6024,27394,3601.871482,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,port-compressor,3601.871482,False,0.0,False,3601.871482 +aa5398fa-5ba3-4216-9a7e-23b9d94b92b2,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,gpt2-codegolf,7585,4194,11779,245.821412,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,gpt2-codegolf,245.821412,False,0.0,False,245.821412 +18c5e280-cd7b-42a3-8625-6a1fbd4d6efa,grok-4-0709,xai,pytorch-model-cli,9476,4027,13503,603.207313,True,1.0,grok-4-0709,pytorch-model-cli,603.207313,True,0.6,True,603.207313 +54313854-adce-47de-9c1c-9993e95a3b4f,claude-sonnet-4-20250514,anthropic,path-tracing-reverse,13732,13350,27082,1486.747992,False,0.0,claude-sonnet-4-20250514,path-tracing-reverse,1486.747992,False,0.0,False,1486.747992 +2ead6217-9dce-439d-8ba7-f6af67734429,grok-4-0709,xai,log-summary-date-ranges,2204,2464,4668,561.700113,False,0.0,grok-4-0709,log-summary-date-ranges,561.700113,False,0.0,False,561.700113 +55714eef-d2c2-4210-ba57-a7c3728c5304,claude-opus-4-1-20250805,anthropic,pytorch-model-recovery,8029,5032,13061,274.897067,True,1.0,claude-opus-4-1-20250805,pytorch-model-recovery,274.897067,True,1.0,True,274.897067 +07abddd0-8a13-4559-a31b-137e7b339203,claude-opus-4-1-20250805,anthropic,break-filter-js-from-html,9607,9602,19209,1220.980814,False,0.0,claude-opus-4-1-20250805,break-filter-js-from-html,1220.980814,False,0.2222222222222222,False,1220.980814 +7c7d3303-e31f-46bf-8fe6-a7831ee0e973,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,configure-git-webserver,10242,1651,11893,217.175653,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,configure-git-webserver,217.175653,False,0.6,False,217.175653 
+17fe88ee-476b-4399-9160-163d1a4d6018,gpt-5-mini,openai,make-doom-for-mips,16116,4359,20475,906.577662,False,0.0,gpt-5-mini,make-doom-for-mips,906.577662,False,0.0,False,906.577662 +95fdc1a7-ef46-44fe-93b4-d1b20c433e3f,grok-4-0709,xai,openssl-selfsigned-cert,1687,1012,2699,163.036398,False,0.0,grok-4-0709,openssl-selfsigned-cert,163.036398,False,0.0,False,163.036398 +d58a333c-c74e-41d6-9062-21be85c74b1e,openai/gpt-oss-120b,together_ai,cobol-modernization,5127,3557,8684,172.744965,True,1.0,openai/gpt-oss-120b,cobol-modernization,172.744965,True,0.8,True,172.744965 +dbf42741-22a3-484a-aea8-586d8771719d,moonshotai/Kimi-K2-Instruct-0905,together_ai,break-filter-js-from-html,9210,12744,21954,1214.264073,False,0.0,moonshotai/Kimi-K2-Instruct-0905,break-filter-js-from-html,1214.264073,False,0.0,False,1214.264073 +b14de3d6-fff4-4d05-a26f-e81a3eb314b4,grok-code-fast-1,xai,prove-plus-comm,1748,1607,3355,93.848716,True,1.0,grok-code-fast-1,prove-plus-comm,93.848716,True,0.4,True,93.848716 +ec0abb8c-d882-4b9a-8944-8bdfe6f664ec,gemini-2.5-pro,gemini,sparql-university,5497,1833,7330,127.174053,True,1.0,gemini-2.5-pro,sparql-university,127.174053,True,0.6,True,127.174053 +f8204e16-9b97-4616-a709-4c978e18f931,grok-code-fast-1,xai,hf-model-inference,3669,1236,4905,84.616999,False,0.0,grok-code-fast-1,hf-model-inference,84.616999,False,0.4,False,84.616999 +91735112-00ac-4875-8de9-b2f1e7aba7a3,zai-org/GLM-4.5-Air-FP8,together_ai,polyglot-c-py,12232,10789,23021,911.513251,False,0.0,zai-org/GLM-4.5-Air-FP8,polyglot-c-py,911.513251,False,0.0,False,911.513251 +e0b75daa-1c65-4263-86ac-646d7906e36b,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,gpt2-codegolf,2737,2668,5405,242.081573,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,gpt2-codegolf,242.081573,False,0.0,False,242.081573 
+5f96c7f8-c590-4f5b-a61d-dae288a58ff9,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-cython-ext,7560,2943,10503,907.262655,False,0.0,moonshotai/Kimi-K2-Instruct-0905,build-cython-ext,907.262655,False,0.0,False,907.262655 +18aab19a-ca7e-444b-8372-dda7abb9b3f9,OpenAI/gpt-oss-20B,together_ai,build-pov-ray,602,1992,2594,250.990985,False,0.0,OpenAI/gpt-oss-20B,build-pov-ray,250.990985,False,0.0,False,250.990985 +1819721b-f274-40fc-b555-94bfc70da60a,grok-code-fast-1,xai,circuit-fibsqrt,8601,8599,17200,283.542628,False,0.0,grok-code-fast-1,circuit-fibsqrt,283.542628,False,0.0,False,283.542628 +0ee9d999-cb3c-465b-8bfa-4556a81d1c5b,grok-code-fast-1,xai,wasm-pipeline,9722,2379,12101,737.068533,False,0.0,grok-code-fast-1,wasm-pipeline,737.068533,False,0.2,False,737.068533 +fec4817a-e77d-44b2-b74b-d9ae33b124a4,gpt-5,openai,large-scale-text-editing,5665,1956,7621,148.21879,True,1.0,gpt-5,large-scale-text-editing,148.21879,True,0.4285714285714285,True,148.21879 +59c845bf-6cb8-4d6f-83ef-5f79804aa926,claude-opus-4-1-20250805,anthropic,mteb-leaderboard,1973,2327,4300,457.663343,False,0.0,claude-opus-4-1-20250805,mteb-leaderboard,457.663343,False,0.0,False,457.663343 +cb6167f6-5a39-4e8d-8579-506414cb37be,gpt-5,openai,constraints-scheduling,3560,1481,5041,192.297308,True,1.0,gpt-5,constraints-scheduling,192.297308,True,0.8571428571428571,True,192.297308 +41634c72-f817-4506-aa31-7e4de3ed8582,claude-opus-4-1-20250805,anthropic,reshard-c4-data,8741,5883,14624,900.00652,False,0.0,claude-opus-4-1-20250805,reshard-c4-data,900.00652,False,0.0,False,900.00652 +67484e4e-39b0-4977-b1cf-317583dbb287,openai/gpt-oss-120b,together_ai,gpt2-codegolf,2590,6215,8805,910.407775,False,0.0,openai/gpt-oss-120b,gpt2-codegolf,910.407775,False,0.0,False,910.407775 +c84ff7ef-2609-476d-8adc-61c58e43c6b4,moonshotai/Kimi-K2-Instruct-0905,together_ai,prove-plus-comm,2422,2718,5140,901.598533,False,0.0,moonshotai/Kimi-K2-Instruct-0905,prove-plus-comm,901.598533,False,0.8,False,901.598533 
+976bea3b-4536-4fcc-9723-2fc0d1cfd50b,gpt-5,openai,db-wal-recovery,12421,10398,22819,924.188288,False,0.0,gpt-5,db-wal-recovery,924.188288,False,0.1428571428571428,False,924.188288 +e075ac72-b6d5-4535-aae3-030b145348a4,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,crack-7z-hash,3893,2255,6148,184.537121,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,crack-7z-hash,184.537121,False,0.0,False,184.537121 +e4304038-2fb4-4b21-9153-7ce10fda6a58,gpt-5-mini,openai,tune-mjcf,13393,9814,23207,900.114155,False,0.0,gpt-5-mini,tune-mjcf,900.114155,False,0.0,False,900.114155 +f8c7c687-15a0-484a-b782-643a254ac90b,OpenAI/gpt-oss-20B,together_ai,path-tracing,2028,8804,10832,447.297145,False,0.0,OpenAI/gpt-oss-20B,path-tracing,447.297145,False,0.0,False,447.297145 +87d93e13-ab4a-4fe3-a171-c60698fafd88,grok-4-0709,xai,torch-tensor-parallelism,1697,937,2634,306.449619,False,0.0,grok-4-0709,torch-tensor-parallelism,306.449619,False,0.0,False,306.449619 +989b4cfe-2edf-4000-bfde-902f45637d88,deepseek-ai/DeepSeek-V3.1,together_ai,configure-git-webserver,7134,2045,9179,326.769556,True,1.0,deepseek-ai/DeepSeek-V3.1,configure-git-webserver,326.769556,True,1.0,True,326.769556 +c255282b-22d1-47b2-a359-a4e70e592ee5,gpt-5-mini,openai,polyglot-c-py,2240,2711,4951,900.001983,False,0.0,gpt-5-mini,polyglot-c-py,900.001983,False,0.0,False,900.001983 +8dd02d32-814e-478d-a0d2-b0c821c6f2ec,grok-code-fast-1,xai,install-windows-3.11,5749,2210,7959,1112.760538,False,0.0,grok-code-fast-1,install-windows-3.11,1112.760538,False,0.0,False,1112.760538 +06458568-ee0f-499e-b3af-380fd4396614,grok-4-0709,xai,model-extraction-relu-logits,1949,1407,3356,848.49283,False,0.0,grok-4-0709,model-extraction-relu-logits,848.49283,False,0.0,False,848.49283 +dab6079e-9216-41a5-8bcb-a520c600c34f,zai-org/GLM-4.5-Air-FP8,together_ai,crack-7z-hash,17621,4510,22131,904.448797,False,0.0,zai-org/GLM-4.5-Air-FP8,crack-7z-hash,904.448797,False,0.0,False,904.448797 
+810031f6-3b2c-4382-ba5c-ff8e8d490ca1,zai-org/GLM-4.5-Air-FP8,together_ai,schemelike-metacircular-eval,7656,16021,23677,2430.088674,False,0.0,zai-org/GLM-4.5-Air-FP8,schemelike-metacircular-eval,2430.088674,False,0.0,False,2430.088674 +8d53738e-78fa-40a4-a012-104d00581289,gemini-2.5-flash,gemini,feal-linear-cryptanalysis,17670,37952,55622,1828.375895,False,0.0,gemini-2.5-flash,feal-linear-cryptanalysis,1828.375895,False,0.0,False,1828.375895 +269e2288-f545-497e-98a6-318d1b2a1cfb,gpt-5,openai,mteb-retrieve,2566,1320,3886,316.201927,False,0.0,gpt-5,mteb-retrieve,316.201927,False,0.0,False,316.201927 +85d65925-9c3c-405b-a8fc-8c40e6c2ab52,gemini-2.5-flash,gemini,make-mips-interpreter,4643,59423,64066,1800.722235,False,0.0,gemini-2.5-flash,make-mips-interpreter,1800.722235,False,0.0,False,1800.722235 +7e1f9aec-c1a5-4c77-9489-88a90ca767ad,gpt-5,openai,video-processing,3983,4170,8153,211.50711,False,0.0,gpt-5,video-processing,211.50711,False,0.0,False,211.50711 +2a604b79-7fec-47d4-8ad4-a79ab9d46ac3,moonshotai/Kimi-K2-Instruct-0905,together_ai,chess-best-move,11300,9636,20936,559.726776,False,0.0,moonshotai/Kimi-K2-Instruct-0905,chess-best-move,559.726776,False,0.0,False,559.726776 +f0a8e266-432f-44ca-a37d-b9f570968edc,claude-opus-4-1-20250805,anthropic,schemelike-metacircular-eval,45125,53090,98215,2407.978294,False,0.0,claude-opus-4-1-20250805,schemelike-metacircular-eval,2407.978294,False,0.0,False,2407.978294 +fdf2e318-f7d6-4ad5-bb3f-3dbb1dc3caab,claude-opus-4-1-20250805,anthropic,build-initramfs-qemu,30807,9680,40487,915.374893,False,0.0,claude-opus-4-1-20250805,build-initramfs-qemu,915.374893,False,0.0,False,915.374893 +908fd45f-ef96-49cb-9c88-7514f3f59e98,grok-code-fast-1,xai,install-windows-3.11,8434,3207,11641,222.356272,False,0.0,grok-code-fast-1,install-windows-3.11,222.356272,False,0.0,False,222.356272 
+639ce984-cf12-41cc-ae92-21d7b63f7f30,OpenAI/gpt-oss-20B,together_ai,build-initramfs-qemu,1437,1100,2537,76.339363,False,0.0,OpenAI/gpt-oss-20B,build-initramfs-qemu,76.339363,False,0.0,False,76.339363 +19d8c536-6f18-4fa9-913f-ae2fc6de081b,claude-sonnet-4-20250514,anthropic,dna-insert,10743,5466,16209,376.229573,False,0.0,claude-sonnet-4-20250514,dna-insert,376.229573,False,0.0,False,376.229573 +986fdea7-2ccf-45aa-845e-47b004b01fbe,gemini-2.5-flash,gemini,code-from-image,8459,4633,13092,279.361533,False,0.0,gemini-2.5-flash,code-from-image,279.361533,False,0.4,False,279.361533 +5e091d0c-f174-4d2e-8459-f389aa1e56a8,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sparql-university,7999,2199,10198,740.661314,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sparql-university,740.661314,False,0.0,False,740.661314 +d7698122-e62a-4fe9-b957-7f78bc30e1d3,gpt-5,openai,cancel-async-tasks,1549,874,2423,180.043629,False,0.0,gpt-5,cancel-async-tasks,180.043629,False,0.6,False,180.043629 +c37d6317-c16e-43d4-842e-c6099c93f886,gemini-2.5-flash,gemini,port-compressor,23730,21183,44913,3601.932202,False,0.0,gemini-2.5-flash,port-compressor,3601.932202,False,0.0,False,3601.932202 +aaac5bd2-2d9a-48ae-b23a-2f7db5e77c15,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,mteb-retrieve,2511,1226,3737,214.508221,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,mteb-retrieve,214.508221,False,0.0,False,214.508221 +29748f49-c251-4ddd-a308-cb928cc39b5e,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,log-summary-date-ranges,4073,1472,5545,128.638703,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,log-summary-date-ranges,128.638703,False,0.0,False,128.638703 +3fc364b4-bc33-49df-8469-ea7143b0a987,claude-opus-4-1-20250805,anthropic,merge-diff-arc-agi-task,12257,4729,16986,950.452803,False,0.0,claude-opus-4-1-20250805,merge-diff-arc-agi-task,950.452803,False,0.3333333333333333,False,950.452803 
+d9be9628-abe8-4272-80c1-b785230e27fa,claude-sonnet-4-20250514,anthropic,dna-assembly,12444,7707,20151,755.008952,False,0.0,claude-sonnet-4-20250514,dna-assembly,755.008952,False,0.0,False,755.008952 +3182f1f2-49c3-417b-946c-117e2712bf7d,grok-4-0709,xai,hf-model-inference,4452,1270,5722,552.151505,True,1.0,grok-4-0709,hf-model-inference,552.151505,True,1.0,True,552.151505 +68d460e9-ba62-4b1b-8064-f2f5461eb415,OpenAI/gpt-oss-20B,together_ai,merge-diff-arc-agi-task,727,1720,2447,152.628457,False,0.0,OpenAI/gpt-oss-20B,merge-diff-arc-agi-task,152.628457,False,0.0,False,152.628457 +84c14f0a-0fca-4aa7-a9f1-ecf6f639be12,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,install-windows-3.11,14566,6918,21484,763.00718,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,install-windows-3.11,763.00718,False,0.0,False,763.00718 +b909de70-bc0e-44e2-8c7b-3cc1673d095b,grok-code-fast-1,xai,sparql-university,1516,889,2405,66.73889,False,0.0,grok-code-fast-1,sparql-university,66.73889,False,0.2,False,66.73889 +ce5acadf-52ac-46f1-9156-4e97bab3f8d5,gemini-2.5-flash,gemini,polyglot-c-py,1702,922,2624,570.089975,False,0.0,gemini-2.5-flash,polyglot-c-py,570.089975,False,0.0,False,570.089975 +7e0cf1d1-6a8c-464c-9cdc-1fef9e8c66fa,moonshotai/Kimi-K2-Instruct-0905,together_ai,feal-differential-cryptanalysis,25165,27609,52774,1271.928934,False,0.0,moonshotai/Kimi-K2-Instruct-0905,feal-differential-cryptanalysis,1271.928934,False,0.0,False,1271.928934 +0edb2b34-cecf-4acb-af41-074d52ea8bc8,grok-4-0709,xai,openssl-selfsigned-cert,1682,951,2633,116.44857,False,0.0,grok-4-0709,openssl-selfsigned-cert,116.44857,False,0.0,False,116.44857 +cb7b9966-b944-41ca-8e17-b32721917949,gemini-2.5-pro,gemini,make-mips-interpreter,16884,18677,35561,1084.159161,False,0.0,gemini-2.5-pro,make-mips-interpreter,1084.159161,False,0.0,False,1084.159161 
+e10ed5a2-5699-42b3-b392-0b39b79731fa,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-pmars,14978,6854,21832,749.380596,True,1.0,moonshotai/Kimi-K2-Instruct-0905,build-pmars,749.380596,True,0.8,True,749.380596 +83ffc759-3c9a-425b-8702-d5ea5fb6e06e,grok-code-fast-1,xai,path-tracing,1521,1195,2716,900.052758,False,0.0,grok-code-fast-1,path-tracing,900.052758,False,0.0,False,900.052758 +06011a48-5bb2-4572-a348-5d57a1cca624,claude-sonnet-4-20250514,anthropic,path-tracing,2379,1225,3604,1806.632549,False,0.0,claude-sonnet-4-20250514,path-tracing,1806.632549,False,0.0,False,1806.632549 +1ca213e3-36ef-40ee-8a6b-56961e985a7a,gpt-5-nano,openai,bn-fit-modify,10906,6571,17477,918.295451,False,0.0,gpt-5-nano,bn-fit-modify,918.295451,False,0.0,False,918.295451 +183a74b1-e151-4dcb-a3eb-866e516d67a4,gemini-2.5-flash,gemini,polyglot-rust-c,1389,1754,3143,936.539184,False,0.0,gemini-2.5-flash,polyglot-rust-c,936.539184,False,0.0,False,936.539184 +938e8490-0734-4060-8e96-96cb4326be15,grok-code-fast-1,xai,cancel-async-tasks,1360,717,2077,99.131105,True,1.0,grok-code-fast-1,cancel-async-tasks,99.131105,True,0.2,True,99.131105 +a171470f-6272-4e3d-b8f3-9dbff056014a,gpt-5-nano,openai,password-recovery,3025,7972,10997,906.166665,False,0.0,gpt-5-nano,password-recovery,906.166665,False,0.0,False,906.166665 +c21d2c6a-a75b-4af2-9ef7-62d545054e62,gpt-5,openai,pytorch-model-recovery,6880,4811,11691,263.355408,True,1.0,gpt-5,pytorch-model-recovery,263.355408,True,0.4285714285714285,True,263.355408 +a4a62168-cb3a-4df7-8fe7-8f13eb40ca3b,grok-4-0709,xai,form-filling,3453,2436,5889,310.68523,False,0.0,grok-4-0709,form-filling,310.68523,False,0.2,False,310.68523 +a8c47109-9595-4109-a8b0-ba1fb8bd3f47,gemini-2.5-flash,gemini,filter-js-from-html,3203,21660,24863,900.006478,False,0.0,gemini-2.5-flash,filter-js-from-html,900.006478,False,0.0,False,900.006478 
+d77ba50c-fa36-4768-b4f0-1c5e4ac1460b,gemini-2.5-pro,gemini,sqlite-db-truncate,3616,2029,5645,203.311204,False,0.0,gemini-2.5-pro,sqlite-db-truncate,203.311204,False,0.0,False,203.311204 +d38d3fba-f8aa-4c1d-8c26-cd660d664238,claude-sonnet-4-20250514,anthropic,build-cython-ext,16181,6478,22659,900.255359,False,0.0,claude-sonnet-4-20250514,build-cython-ext,900.255359,False,0.0,False,900.255359 +4958dae9-e076-4be4-8684-c2640a38a643,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,regex-log,1181,977,2158,79.010063,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,regex-log,79.010063,False,0.0,False,79.010063 +a8f215e1-ed86-4396-9cf3-220dedb14464,grok-code-fast-1,xai,financial-document-processor,2900,2043,4943,87.683204,False,0.0,grok-code-fast-1,financial-document-processor,87.683204,False,0.0,False,87.683204 +32643ad4-56d3-45b3-9ec9-156cf2dee495,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,financial-document-processor,11189,6011,17200,575.294524,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,financial-document-processor,575.294524,False,0.0,False,575.294524 +bfb78a1a-8f3f-4dcf-bbfa-950deb3b93b7,claude-opus-4-1-20250805,anthropic,schemelike-metacircular-eval,31012,25868,56880,2403.425143,False,0.0,claude-opus-4-1-20250805,schemelike-metacircular-eval,2403.425143,False,0.0,False,2403.425143 +7c3c2db3-61e1-429e-9c59-316b6f963a11,openai/gpt-oss-120b,together_ai,wasm-pipeline,3361,6202,9563,345.992577,False,0.0,openai/gpt-oss-120b,wasm-pipeline,345.992577,False,0.0,False,345.992577 +9718e6fe-22ba-4edd-87e3-ef73453b249e,gpt-5,openai,form-filling,13735,35400,49135,905.86045,False,0.0,gpt-5,form-filling,905.86045,False,0.8,False,905.86045 +4e730c48-1027-46e4-8b31-b2663734536d,claude-opus-4-1-20250805,anthropic,fix-git,2096,1354,3450,52.513478,True,1.0,claude-opus-4-1-20250805,fix-git,52.513478,True,1.0,True,52.513478 
+bc7ef71c-06b2-48df-9499-f36a9d76e93b,gpt-5,openai,make-mips-interpreter,14271,55875,70146,1800.206438,False,0.0,gpt-5,make-mips-interpreter,1800.206438,False,0.0,False,1800.206438 +93a64d85-0ac2-4f68-bd4c-ffe172219c49,zai-org/GLM-4.5-Air-FP8,together_ai,feal-differential-cryptanalysis,3270,2908,6178,140.430419,False,0.0,zai-org/GLM-4.5-Air-FP8,feal-differential-cryptanalysis,140.430419,False,0.0,False,140.430419 +7403a09a-0fc1-451f-b066-27f71cd7562a,openai/gpt-oss-120b,together_ai,fix-ocaml-gc,13215,6046,19261,3852.052565,False,0.0,openai/gpt-oss-120b,fix-ocaml-gc,3852.052565,False,0.0,False,3852.052565 +1a9ba0d6-aab8-40ce-bc4d-d9e277f114d2,grok-4-0709,xai,feal-differential-cryptanalysis,2465,1496,3961,826.135716,True,1.0,grok-4-0709,feal-differential-cryptanalysis,826.135716,True,0.8,True,826.135716 +d1c3109b-e239-448e-8137-211b014cb004,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,feal-differential-cryptanalysis,3976,2387,6363,965.669238,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,feal-differential-cryptanalysis,965.669238,False,0.0,False,965.669238 +c40641fe-8ddf-48f0-94fe-59c0465eecbd,claude-sonnet-4-20250514,anthropic,torch-tensor-parallelism,4341,3040,7381,173.524139,False,0.0,claude-sonnet-4-20250514,torch-tensor-parallelism,173.524139,False,0.0,False,173.524139 +b0944d34-ea3f-4453-8fec-003053e20b08,deepseek-ai/DeepSeek-V3.1,together_ai,path-tracing,19462,19675,39137,1129.965242,False,0.0,deepseek-ai/DeepSeek-V3.1,path-tracing,1129.965242,False,0.0,False,1129.965242 +c470baf0-d1a3-452d-bb8e-cb4f1941b615,OpenAI/gpt-oss-20B,together_ai,model-extraction-relu-logits,489,477,966,27.105275,False,0.0,OpenAI/gpt-oss-20B,model-extraction-relu-logits,27.105275,False,0.0,False,27.105275 +9751ac0e-851c-46aa-9285-8305f9ff064f,claude-opus-4-1-20250805,anthropic,qemu-startup,3053,2005,5058,153.667311,False,0.0,claude-opus-4-1-20250805,qemu-startup,153.667311,False,0.4285714285714285,False,153.667311 
+5c5e338a-cd06-4c00-9a96-2996381e18bf,deepseek-ai/DeepSeek-V3.1,together_ai,cobol-modernization,21709,19133,40842,779.133076,False,0.0,deepseek-ai/DeepSeek-V3.1,cobol-modernization,779.133076,False,0.6,False,779.133076 +8f18950b-6520-4516-9d58-e1a6f82cdc34,claude-opus-4-1-20250805,anthropic,fix-git,3100,1820,4920,140.710414,True,1.0,claude-opus-4-1-20250805,fix-git,140.710414,True,1.0,True,140.710414 +78b95d47-1386-41de-97ab-202a491962bd,OpenAI/gpt-oss-20B,together_ai,video-processing,1160,2531,3691,250.272492,False,0.0,OpenAI/gpt-oss-20B,video-processing,250.272492,False,0.0,False,250.272492 +4bc91b62-ce6a-4b2a-bb71-618424aa2c6c,moonshotai/Kimi-K2-Instruct-0905,together_ai,sqlite-with-gcov,15952,3368,19320,442.039122,True,1.0,moonshotai/Kimi-K2-Instruct-0905,sqlite-with-gcov,442.039122,True,0.4,True,442.039122 +6896217d-dd24-4978-a10d-38b55a37fd4f,grok-code-fast-1,xai,password-recovery,5869,2873,8742,274.347955,False,0.0,grok-code-fast-1,password-recovery,274.347955,False,0.0,False,274.347955 +0fc82369-61f1-442e-bb17-a7046f9bc3c3,OpenAI/gpt-oss-20B,together_ai,prove-plus-comm,430,2365,2795,91.306081,False,0.0,OpenAI/gpt-oss-20B,prove-plus-comm,91.306081,False,0.0,False,91.306081 +f91c8df8-8dcc-4560-8428-117a80792864,claude-sonnet-4-20250514,anthropic,sqlite-with-gcov,11332,3933,15265,595.000597,False,0.0,claude-sonnet-4-20250514,sqlite-with-gcov,595.000597,False,0.2,False,595.000597 +78f0df05-f587-4a4d-8de2-56d0da1cf5fe,gpt-5-mini,openai,circuit-fibsqrt,29264,50254,79518,3605.750887,False,0.0,gpt-5-mini,circuit-fibsqrt,3605.750887,False,0.0,False,3605.750887 +6615f05e-c2ed-49b6-bf01-96a712db82df,deepseek-ai/DeepSeek-V3.1,together_ai,gpt2-codegolf,15040,14856,29896,903.040607,False,0.0,deepseek-ai/DeepSeek-V3.1,gpt2-codegolf,903.040607,False,0.0,False,903.040607 +df957d08-02e9-4bc0-acff-7610730cb2f5,OpenAI/gpt-oss-20B,together_ai,qemu-startup,1452,6097,7549,900.076557,False,0.0,OpenAI/gpt-oss-20B,qemu-startup,900.076557,False,0.0,False,900.076557 
+81452652-ab8e-4c87-a3c6-47fc9ab257d2,OpenAI/gpt-oss-20B,together_ai,port-compressor,6151,30744,36895,413.329541,False,0.0,OpenAI/gpt-oss-20B,port-compressor,413.329541,False,0.0,False,413.329541 +d15453ca-0a5b-4980-92b8-d4ab222553fc,deepseek-ai/DeepSeek-V3.1,together_ai,pypi-server,12255,5447,17702,863.334157,False,0.0,deepseek-ai/DeepSeek-V3.1,pypi-server,863.334157,False,0.4,False,863.334157 +f2c36357-3159-4844-aabd-58c4159f957d,moonshotai/Kimi-K2-Instruct-0905,together_ai,filter-js-from-html,3638,3287,6925,746.395909,False,0.0,moonshotai/Kimi-K2-Instruct-0905,filter-js-from-html,746.395909,False,0.0,False,746.395909 +2df4eb12-2067-456e-a26f-da04b97a0445,gemini-2.5-flash,gemini,feal-linear-cryptanalysis,8304,6323,14627,657.466154,False,0.0,gemini-2.5-flash,feal-linear-cryptanalysis,657.466154,False,0.0,False,657.466154 +49185b8e-9a4a-4426-bd1e-2797344e2377,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,port-compressor,53971,30285,84256,3600.001877,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,port-compressor,3600.001877,False,0.0,False,3600.001877 +ad43c031-dbd6-4417-9e16-15c74eb7cd02,gemini-2.5-flash,gemini,install-klee-minimal,14893,2907,17800,906.371958,False,0.0,gemini-2.5-flash,install-klee-minimal,906.371958,False,0.0,False,906.371958 +6083b672-b030-41d8-bdf8-98b6801c2ab7,claude-sonnet-4-20250514,anthropic,prove-plus-comm,2615,2535,5150,489.077852,True,1.0,claude-sonnet-4-20250514,prove-plus-comm,489.077852,True,1.0,True,489.077852 +c86f2110-37fd-43a2-9bc4-d0259420da96,gemini-2.5-flash,gemini,bn-fit-modify,21420,39016,60436,3600.030334,False,0.0,gemini-2.5-flash,bn-fit-modify,3600.030334,False,0.0,False,3600.030334 +f0169179-6e40-4386-81c2-1224307f8109,openai/gpt-oss-120b,together_ai,qemu-startup,1575,1086,2661,710.100094,False,0.0,openai/gpt-oss-120b,qemu-startup,710.100094,False,0.0,False,710.100094 
+152e4a54-47e2-4cfc-af48-5eef0432d035,openai/gpt-oss-120b,together_ai,form-filling,11557,8634,20191,455.258407,True,1.0,openai/gpt-oss-120b,form-filling,455.258407,True,0.6,True,455.258407 +36736c49-f973-4f04-a4d6-0f70f8b434da,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,prove-plus-comm,1934,2611,4545,421.592904,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,prove-plus-comm,421.592904,False,0.2,False,421.592904 +57191ccb-e58b-4421-a92e-49d6b0220b21,gemini-2.5-pro,gemini,distribution-search,10597,10688,21285,641.21183,True,1.0,gemini-2.5-pro,distribution-search,641.21183,True,0.6,True,641.21183 +0ed143cf-2262-4005-91b6-c1d20a078995,gemini-2.5-pro,gemini,sqlite-db-truncate,4785,2120,6905,357.585043,False,0.0,gemini-2.5-pro,sqlite-db-truncate,357.585043,False,0.0,False,357.585043 +6e1012e9-d93a-4f4e-afcb-485424525ae2,OpenAI/gpt-oss-20B,together_ai,git-leak-recovery,587,1386,1973,159.565248,False,0.0,OpenAI/gpt-oss-20B,git-leak-recovery,159.565248,False,0.0,False,159.565248 +b00e4c95-d8c4-4385-b8aa-724252409d4a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,code-from-image,5776,1525,7301,185.486745,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,code-from-image,185.486745,False,0.4,False,185.486745 +f6b71d70-b7c6-4606-9b5a-48a07c0f8635,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,dna-insert,6947,2569,9516,554.977483,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,dna-insert,554.977483,False,0.0,False,554.977483 +e317f8df-d9d0-4d85-ad81-ff38b60a451e,gpt-5-mini,openai,large-scale-text-editing,9054,5901,14955,1200.02821,True,1.0,gpt-5-mini,large-scale-text-editing,1200.02821,True,0.2,True,1200.02821 +f92162b0-9993-4fa1-bdbf-6388fc8c7f6b,claude-opus-4-1-20250805,anthropic,sanitize-git-repo,14985,3968,18953,457.052309,False,0.0,claude-opus-4-1-20250805,sanitize-git-repo,457.052309,False,0.0,False,457.052309 
+edfb2ef8-16b5-467d-bd17-21336d7b113d,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,feal-differential-cryptanalysis,19948,12963,32911,468.020863,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,feal-differential-cryptanalysis,468.020863,False,0.0,False,468.020863 +d3f409e7-2c2c-4af2-85fc-462581211307,OpenAI/gpt-oss-20B,together_ai,make-doom-for-mips,1991,4034,6025,350.095345,False,0.0,OpenAI/gpt-oss-20B,make-doom-for-mips,350.095345,False,0.0,False,350.095345 +66acf2b0-01fb-44de-a29c-d1f341c79995,claude-sonnet-4-20250514,anthropic,circuit-fibsqrt,18528,18815,37343,1212.977427,False,0.0,claude-sonnet-4-20250514,circuit-fibsqrt,1212.977427,False,0.0,False,1212.977427 +eca79125-88db-4820-a3e2-af90f96ae8d8,moonshotai/Kimi-K2-Instruct-0905,together_ai,mteb-leaderboard,20960,9288,30248,1342.634596,False,0.0,moonshotai/Kimi-K2-Instruct-0905,mteb-leaderboard,1342.634596,False,0.0,False,1342.634596 +2d94f936-7b6a-4114-9f4e-efdba474f2c7,claude-opus-4-1-20250805,anthropic,cobol-modernization,19965,14472,34437,904.295166,True,1.0,claude-opus-4-1-20250805,cobol-modernization,904.295166,True,0.875,True,904.295166 +3fab5d00-5e53-4e88-99fd-c5e220b7c866,grok-4-0709,xai,largest-eigenval,9306,3461,12767,913.75097,False,0.0,grok-4-0709,largest-eigenval,913.75097,False,0.0,False,913.75097 +4a7d9634-bd75-4a1f-887d-f2e90f5769c7,gemini-2.5-flash,gemini,sqlite-with-gcov,9522,1930,11452,529.576716,False,0.0,gemini-2.5-flash,sqlite-with-gcov,529.576716,False,0.2,False,529.576716 +9bd077b3-0c98-40ba-9db8-c3f042dca5ba,gemini-2.5-pro,gemini,nginx-request-logging,3709,1320,5029,290.799818,False,0.0,gemini-2.5-pro,nginx-request-logging,290.799818,False,0.6,False,290.799818 +6b3efbe6-cfe3-4ad1-a0cf-d2c822395dae,gpt-5,openai,nginx-request-logging,4521,1394,5915,193.951082,True,1.0,gpt-5,nginx-request-logging,193.951082,True,1.0,True,193.951082 
+78c8ff98-65e7-49bb-be76-7527e43dedf7,claude-sonnet-4-20250514,anthropic,sqlite-with-gcov,10975,2513,13488,362.022982,True,1.0,claude-sonnet-4-20250514,sqlite-with-gcov,362.022982,True,0.2,True,362.022982 +a7167d17-ee02-404b-b27a-fb286dee49a6,OpenAI/gpt-oss-20B,together_ai,mteb-leaderboard,202,717,919,337.763497,False,0.0,OpenAI/gpt-oss-20B,mteb-leaderboard,337.763497,False,0.0,False,337.763497 +07713ad8-d4e0-4a7d-bfa9-ecc24dc5c356,gemini-2.5-flash,gemini,code-from-image,5537,10291,15828,1200.001559,False,0.0,gemini-2.5-flash,code-from-image,1200.001559,False,0.4,False,1200.001559 +9ee6a853-0115-4891-a482-163cccd25060,OpenAI/gpt-oss-20B,together_ai,model-extraction-relu-logits,2044,2038,4082,123.24147,False,0.0,OpenAI/gpt-oss-20B,model-extraction-relu-logits,123.24147,False,0.0,False,123.24147 +8be099ba-c0ed-49a9-ad52-e0985226337b,gemini-2.5-flash,gemini,gpt2-codegolf,2810,2774,5584,219.296895,False,0.0,gemini-2.5-flash,gpt2-codegolf,219.296895,False,0.0,False,219.296895 +86585e68-632e-4ea5-8fe0-f1e7674894fc,OpenAI/gpt-oss-20B,together_ai,pytorch-model-cli,548,1371,1919,73.313045,False,0.0,OpenAI/gpt-oss-20B,pytorch-model-cli,73.313045,False,0.0,False,73.313045 +324c3702-7add-4ca9-9e24-7acbfa13fb4b,claude-opus-4-1-20250805,anthropic,make-mips-interpreter,30349,28444,58793,1801.350194,False,0.0,claude-opus-4-1-20250805,make-mips-interpreter,1801.350194,False,0.0,False,1801.350194 +10c49c67-5897-4bfd-9d09-b0b5afdfd329,deepseek-ai/DeepSeek-V3.1,together_ai,reverse-engineering,12332,6130,18462,496.798506,True,1.0,deepseek-ai/DeepSeek-V3.1,reverse-engineering,496.798506,True,0.2,True,496.798506 +0fb02eae-38a9-4240-8a87-a5e4280652c5,grok-code-fast-1,xai,prove-plus-comm,1473,2527,4000,179.639355,False,0.0,grok-code-fast-1,prove-plus-comm,179.639355,False,0.4,False,179.639355 
+9a79396a-1977-420d-83f7-de94cbe1967f,deepseek-ai/DeepSeek-V3.1,together_ai,feal-linear-cryptanalysis,15634,24298,39932,1808.716178,False,0.0,deepseek-ai/DeepSeek-V3.1,feal-linear-cryptanalysis,1808.716178,False,0.0,False,1808.716178 +e3d8f8d3-1789-4e6b-874c-61483ca81b7b,claude-opus-4-1-20250805,anthropic,dna-insert,18326,10660,28986,360.001079,False,0.0,claude-opus-4-1-20250805,dna-insert,360.001079,False,0.0,False,360.001079 +0da7b865-1d9c-4053-b255-4dd77faa2e1c,grok-code-fast-1,xai,path-tracing-reverse,3104,2526,5630,210.562781,False,0.0,grok-code-fast-1,path-tracing-reverse,210.562781,False,0.0,False,210.562781 +fa533879-633f-44e4-9beb-0367d85fb7a2,gemini-2.5-pro,gemini,mteb-leaderboard,35216,15056,50272,3619.546331,False,0.0,gemini-2.5-pro,mteb-leaderboard,3619.546331,False,0.0,False,3619.546331 +70791c6c-9952-497b-a547-c92af3f188d8,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,mteb-leaderboard,13718,3331,17049,509.635021,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,mteb-leaderboard,509.635021,False,0.0,False,509.635021 +36b1a6c3-b6ec-4584-8b61-56df6d401b2a,gpt-5,openai,build-pmars,7755,2915,10670,569.860484,True,1.0,gpt-5,build-pmars,569.860484,True,0.8,True,569.860484 +3573c70c-9740-4872-961b-6f84a624b0a2,zai-org/GLM-4.5-Air-FP8,together_ai,log-summary-date-ranges,7810,3058,10868,131.317284,True,1.0,zai-org/GLM-4.5-Air-FP8,log-summary-date-ranges,131.317284,True,0.8,True,131.317284 +6de63371-e49b-4bf4-b955-a4adf5ac9169,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,db-wal-recovery,3079,3566,6645,940.987152,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,db-wal-recovery,940.987152,False,0.0,False,940.987152 +4ad46ed6-f07e-41b7-abcc-0950a6af8b2a,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,adaptive-rejection-sampler,10997,9141,20138,902.045639,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,adaptive-rejection-sampler,902.045639,False,0.0,False,902.045639 
+f83bb266-d229-493b-af2f-7706a9625baa,gemini-2.5-flash,gemini,write-compressor,5587,24872,30459,900.214951,False,0.0,gemini-2.5-flash,write-compressor,900.214951,False,0.0,False,900.214951 +f9640edb-8613-4300-8701-477c0512c7b0,grok-4-0709,xai,financial-document-processor,6930,2657,9587,501.25845,False,0.0,grok-4-0709,financial-document-processor,501.25845,False,0.0,False,501.25845 +b5633c60-56d3-4f50-b097-4d8f6daaaab6,gpt-5-nano,openai,polyglot-rust-c,8690,10674,19364,900.140924,False,0.0,gpt-5-nano,polyglot-rust-c,900.140924,False,0.0,False,900.140924 +fa2edbb9-a728-4af7-b0c9-10093ded35b1,claude-sonnet-4-20250514,anthropic,vulnerable-secret,3533,4622,8155,906.159663,False,0.0,claude-sonnet-4-20250514,vulnerable-secret,906.159663,False,0.0,False,906.159663 +00d2059e-bc80-4347-bb40-9ff7a14e1300,claude-opus-4-1-20250805,anthropic,sqlite-db-truncate,7407,5464,12871,428.757811,False,0.0,claude-opus-4-1-20250805,sqlite-db-truncate,428.757811,False,0.125,False,428.757811 +225291d5-e73d-4a74-9d07-962b43a3bb10,openai/gpt-oss-120b,together_ai,cancel-async-tasks,1262,583,1845,24.594396,True,1.0,openai/gpt-oss-120b,cancel-async-tasks,24.594396,True,0.6,True,24.594396 +319b341e-2566-4d2f-9691-c36d6122e1b4,gemini-2.5-pro,gemini,cancel-async-tasks,1296,636,1932,91.491076,False,0.0,gemini-2.5-pro,cancel-async-tasks,91.491076,False,0.0,False,91.491076 +67ca3e36-deeb-43d0-b3b8-a4642d191ef8,gemini-2.5-pro,gemini,build-initramfs-qemu,8462,4020,12482,900.644562,False,0.0,gemini-2.5-pro,build-initramfs-qemu,900.644562,False,0.0,False,900.644562 +3b0fcfda-e096-4c3a-81ca-ab7b74de3f11,claude-sonnet-4-20250514,anthropic,polyglot-c-py,3849,4225,8074,243.673757,False,0.0,claude-sonnet-4-20250514,polyglot-c-py,243.673757,False,0.0,False,243.673757 +c6db3522-30a1-4c34-ae7d-d1f85dc74cd7,claude-opus-4-1-20250805,anthropic,make-doom-for-mips,22482,7941,30423,900.001982,False,0.0,claude-opus-4-1-20250805,make-doom-for-mips,900.001982,False,0.0,False,900.001982 
+901e125f-f6c2-448d-abb4-e68ec54b135c,OpenAI/gpt-oss-20B,together_ai,filter-js-from-html,1893,5830,7723,312.836902,False,0.0,OpenAI/gpt-oss-20B,filter-js-from-html,312.836902,False,0.0,False,312.836902 +9b9db535-975e-4280-b7ac-1467f1351b92,deepseek-ai/DeepSeek-V3.1,together_ai,circuit-fibsqrt,8588,8478,17066,1024.611893,False,0.0,deepseek-ai/DeepSeek-V3.1,circuit-fibsqrt,1024.611893,False,0.0,False,1024.611893 +4cf44c0c-500b-4e52-ab57-70ed854d001e,claude-opus-4-1-20250805,anthropic,constraints-scheduling,5500,3823,9323,379.176898,True,1.0,claude-opus-4-1-20250805,constraints-scheduling,379.176898,True,0.8888888888888888,True,379.176898 +bae64056-e81b-4a90-91f0-2550c3b16c62,claude-opus-4-1-20250805,anthropic,path-tracing-reverse,45525,33757,79282,1800.001176,False,0.0,claude-opus-4-1-20250805,path-tracing-reverse,1800.001176,False,0.0,False,1800.001176 +c2f65f40-7989-4c11-b809-9bd92f8e882e,gpt-5,openai,log-summary-date-ranges,5595,1544,7139,140.757486,False,0.0,gpt-5,log-summary-date-ranges,140.757486,False,0.0,False,140.757486 +640941e1-b733-4c6d-a7b6-0c509318dd4c,gpt-5-mini,openai,distribution-search,2323,1931,4254,297.626007,True,1.0,gpt-5-mini,distribution-search,297.626007,True,1.0,True,297.626007 +27aa0684-23e7-4576-bc2a-a6bde44cba1a,claude-sonnet-4-20250514,anthropic,install-windows-3.11,9434,4100,13534,1377.737715,False,0.0,claude-sonnet-4-20250514,install-windows-3.11,1377.737715,False,0.0,False,1377.737715 +2f0ede3d-11aa-4de1-acef-e9c6adbb2d8a,gpt-5-nano,openai,sqlite-db-truncate,8190,6200,14390,566.002901,False,0.0,gpt-5-nano,sqlite-db-truncate,566.002901,False,0.0,False,566.002901 +ac806f83-435c-4263-a6d1-f5cde8caea93,OpenAI/gpt-oss-20B,together_ai,mteb-leaderboard,923,245,1168,32.60288,False,0.0,OpenAI/gpt-oss-20B,mteb-leaderboard,32.60288,False,0.0,False,32.60288 +b2a74ab0-ebb0-4e5d-a07a-2797d666e93c,gpt-5-nano,openai,pytorch-model-cli,3474,3332,6806,397.23751,False,0.0,gpt-5-nano,pytorch-model-cli,397.23751,False,0.0,False,397.23751 
+43009783-ed25-4a4f-a6f8-e484af7ec17b,zai-org/GLM-4.5-Air-FP8,together_ai,feal-differential-cryptanalysis,5434,4547,9981,253.085367,False,0.0,zai-org/GLM-4.5-Air-FP8,feal-differential-cryptanalysis,253.085367,False,0.0,False,253.085367 +3c45ac9c-e7a5-4b8e-98f9-8a5861ef26ec,gemini-2.5-flash,gemini,large-scale-text-editing,2652,1646,4298,241.052288,False,0.0,gemini-2.5-flash,large-scale-text-editing,241.052288,False,0.0,False,241.052288 +f3fd64ee-c6da-4daf-b4e9-10bda5a18f58,zai-org/GLM-4.5-Air-FP8,together_ai,break-filter-js-from-html,3544,4694,8238,340.818113,False,0.0,zai-org/GLM-4.5-Air-FP8,break-filter-js-from-html,340.818113,False,0.0,False,340.818113 +9ca2a341-893f-412c-a423-c4d6cd8c16bb,claude-opus-4-1-20250805,anthropic,feal-differential-cryptanalysis,29722,33888,63610,1800.001022,False,0.0,claude-opus-4-1-20250805,feal-differential-cryptanalysis,1800.001022,False,0.0,False,1800.001022 +bc78da9d-0314-4fb1-820c-81b24a09f2ac,gpt-5-mini,openai,break-filter-js-from-html,2666,1280,3946,170.990975,False,0.0,gpt-5-mini,break-filter-js-from-html,170.990975,False,0.0,False,170.990975 +e583ab23-4f8b-4ea4-9cb6-b84fce1973d8,openai/gpt-oss-120b,together_ai,filter-js-from-html,1348,755,2103,14.817925,False,0.0,openai/gpt-oss-120b,filter-js-from-html,14.817925,False,0.0,False,14.817925 +a1968094-28ed-479f-b65a-3053caf0afb5,OpenAI/gpt-oss-20B,together_ai,write-compressor,2297,5973,8270,904.365829,False,0.0,OpenAI/gpt-oss-20B,write-compressor,904.365829,False,0.0,False,904.365829 +a01bedaf-0430-4429-b7c5-12f4a8a8206d,deepseek-ai/DeepSeek-V3.1,together_ai,financial-document-processor,11360,5294,16654,424.338483,False,0.0,deepseek-ai/DeepSeek-V3.1,financial-document-processor,424.338483,False,0.0,False,424.338483 +3e244d06-820d-4147-836e-d007dac9cc59,gemini-2.5-pro,gemini,financial-document-processor,9074,3575,12649,531.094791,False,0.0,gemini-2.5-pro,financial-document-processor,531.094791,False,0.0,False,531.094791 
+10a98bb8-8450-48b0-a062-1703ff8840c9,claude-opus-4-1-20250805,anthropic,dna-assembly,26188,20451,46639,624.445139,False,0.0,claude-opus-4-1-20250805,dna-assembly,624.445139,False,0.0,False,624.445139 +568e5d2b-7dcd-48c1-b46c-9236bf862ad0,zai-org/GLM-4.5-Air-FP8,together_ai,largest-eigenval,3387,2645,6032,900.849507,False,0.0,zai-org/GLM-4.5-Air-FP8,largest-eigenval,900.849507,False,0.0,False,900.849507 +3f96f923-505b-417b-ba4c-db87355276a3,OpenAI/gpt-oss-20B,together_ai,bn-fit-modify,424,2950,3374,138.079409,False,0.0,OpenAI/gpt-oss-20B,bn-fit-modify,138.079409,False,0.0,False,138.079409 +5a9d07ee-1578-4478-ab8d-a7f6ed0ed766,claude-opus-4-1-20250805,anthropic,install-klee-minimal,10184,1760,11944,900.136276,False,0.0,claude-opus-4-1-20250805,install-klee-minimal,900.136276,False,0.0,False,900.136276 +79693a76-7347-42f5-a9d1-4e6e14e72f61,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,code-from-image,12371,10002,22373,991.873763,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,code-from-image,991.873763,False,0.2,False,991.873763 +e002ea60-df41-428f-a2e1-ffca3abe586c,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,run-pdp11-code,6419,1789,8208,181.911207,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,run-pdp11-code,181.911207,False,0.0,False,181.911207 +e4cb414c-e754-4e3d-82cf-23616d20a6dc,gemini-2.5-flash,gemini,feal-differential-cryptanalysis,4320,13264,17584,273.586965,False,0.0,gemini-2.5-flash,feal-differential-cryptanalysis,273.586965,False,0.2,False,273.586965 +fb93a8a2-b71b-41f3-a598-0828b59b9855,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,cobol-modernization,9172,4583,13755,678.953582,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,cobol-modernization,678.953582,False,0.0,False,678.953582 
+c95b07d2-7d0b-4d82-bc82-039d5c129240,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,gpt2-codegolf,1633,1931,3564,157.378371,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,gpt2-codegolf,157.378371,False,0.0,False,157.378371 +3c39cdce-39e3-491c-9c4a-e35bb122b626,gpt-5,openai,tune-mjcf,8693,5062,13755,905.418281,False,0.0,gpt-5,tune-mjcf,905.418281,False,0.0,False,905.418281 +b2473772-5749-4e59-a09e-1f8fb863711c,grok-code-fast-1,xai,distribution-search,3096,2896,5992,415.286067,False,0.0,grok-code-fast-1,distribution-search,415.286067,False,0.0,False,415.286067 +b946042c-892a-4d99-bb60-22302b1bff63,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,code-from-image,5019,828,5847,36.479159,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,code-from-image,36.479159,True,0.4,True,36.479159 +7581e486-f025-4d2a-a95f-4628a3e0c9f2,claude-sonnet-4-20250514,anthropic,password-recovery,3629,4205,7834,900.000618,True,1.0,claude-sonnet-4-20250514,password-recovery,900.000618,True,0.4,True,900.000618 +3ae940eb-4526-43c7-8ae0-64992c03d6e2,gpt-5-nano,openai,dna-insert,4138,6584,10722,365.536655,False,0.0,gpt-5-nano,dna-insert,365.536655,False,0.0,False,365.536655 +dbeaa5ee-5fbf-4e66-aab3-219ad58bfe1e,moonshotai/Kimi-K2-Instruct-0905,together_ai,qemu-alpine-ssh,3181,4255,7436,903.037901,False,0.0,moonshotai/Kimi-K2-Instruct-0905,qemu-alpine-ssh,903.037901,False,0.0,False,903.037901 +0312a306-010b-4f77-8283-e0ab629e35fc,gpt-5,openai,reverse-engineering,31998,7045,39043,1139.728573,True,1.0,gpt-5,reverse-engineering,1139.728573,True,0.6666666666666666,True,1139.728573 +43fd16c4-d907-46a8-90cf-7c75e1323de9,gpt-5-nano,openai,reshard-c4-data,8626,7997,16623,454.477631,False,0.0,gpt-5-nano,reshard-c4-data,454.477631,False,0.0,False,454.477631 
+a28b88cf-dd7c-48b8-8cb9-303aa3ede905,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,polyglot-rust-c,8548,9667,18215,969.394023,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,polyglot-rust-c,969.394023,False,0.0,False,969.394023 +49d27d7b-c31b-404d-8dc0-10304583cfa9,OpenAI/gpt-oss-20B,together_ai,install-klee-minimal,5302,17201,22503,912.707267,False,0.0,OpenAI/gpt-oss-20B,install-klee-minimal,912.707267,False,0.0,False,912.707267 +4e980c1c-bc29-4a88-a52c-2d2e2b3a4c0f,openai/gpt-oss-120b,together_ai,openssl-selfsigned-cert,1720,952,2672,55.749684,True,1.0,openai/gpt-oss-120b,openssl-selfsigned-cert,55.749684,True,0.8,True,55.749684 +02ae6604-753c-4223-9a00-e37ef33b9b7e,gpt-5-nano,openai,feal-differential-cryptanalysis,4073,4194,8267,656.719255,False,0.0,gpt-5-nano,feal-differential-cryptanalysis,656.719255,False,0.0,False,656.719255 +a2f0f358-ecd2-4984-bb18-f682b13b2a26,zai-org/GLM-4.5-Air-FP8,together_ai,regex-log,1164,3292,4456,271.495067,False,0.0,zai-org/GLM-4.5-Air-FP8,regex-log,271.495067,False,0.2,False,271.495067 +d3aac658-dcd2-4c5b-a20d-318c6881e5c4,OpenAI/gpt-oss-20B,together_ai,dna-assembly,168,637,805,72.249329,False,0.0,OpenAI/gpt-oss-20B,dna-assembly,72.249329,False,0.0,False,72.249329 +35726627-9bc4-45a5-8853-9782bb718b99,gemini-2.5-pro,gemini,cobol-modernization,5699,4035,9734,343.081688,True,1.0,gemini-2.5-pro,cobol-modernization,343.081688,True,1.0,True,343.081688 +0593056a-8060-43e3-a9ef-66e912f11d26,grok-4-0709,xai,install-windows-3.11,5434,2209,7643,1168.214581,False,0.0,grok-4-0709,install-windows-3.11,1168.214581,False,0.0,False,1168.214581 +3e75a1dc-6a8e-4009-a673-542bcf460d83,deepseek-ai/DeepSeek-V3.1,together_ai,reshard-c4-data,6217,2728,8945,253.422488,False,0.0,deepseek-ai/DeepSeek-V3.1,reshard-c4-data,253.422488,False,0.0,False,253.422488 
+fd2ea1f1-05ec-406a-ade7-8934683ce679,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,circuit-fibsqrt,12162,12913,25075,1050.939795,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,circuit-fibsqrt,1050.939795,False,0.0,False,1050.939795 +207b34fd-80d1-41f7-8624-6ef0b7f0dc72,gpt-5-mini,openai,cancel-async-tasks,2584,1558,4142,439.725406,False,0.0,gpt-5-mini,cancel-async-tasks,439.725406,False,0.4,False,439.725406 +4161c192-3809-4bd8-958e-d3c8236c3d4c,OpenAI/gpt-oss-20B,together_ai,polyglot-c-py,536,624,1160,156.678424,False,0.0,OpenAI/gpt-oss-20B,polyglot-c-py,156.678424,False,0.0,False,156.678424 +91184ff6-ac6f-4fcd-9eaf-ccd93ba8e9f5,OpenAI/gpt-oss-20B,together_ai,sqlite-with-gcov,1242,2669,3911,192.055478,False,0.0,OpenAI/gpt-oss-20B,sqlite-with-gcov,192.055478,False,0.0,False,192.055478 +1441cf57-e3c0-4c64-8093-b9fbf698a10b,gpt-5,openai,largest-eigenval,5614,6878,12492,900.088639,False,0.0,gpt-5,largest-eigenval,900.088639,False,0.0,False,900.088639 +e8f20704-2040-40dc-bf5d-37ef477c3b60,OpenAI/gpt-oss-20B,together_ai,polyglot-rust-c,231,2068,2299,324.601154,False,0.0,OpenAI/gpt-oss-20B,polyglot-rust-c,324.601154,False,0.0,False,324.601154 +a2634787-a53f-4c61-a5cf-f66a9c524ee7,claude-opus-4-1-20250805,anthropic,build-pmars,9069,2544,11613,216.313743,True,1.0,claude-opus-4-1-20250805,build-pmars,216.313743,True,0.5,True,216.313743 +0e10cbd2-d2d5-45ea-bbfe-d51cb746b91a,claude-opus-4-1-20250805,anthropic,log-summary-date-ranges,7690,2068,9758,87.704572,True,1.0,claude-opus-4-1-20250805,log-summary-date-ranges,87.704572,True,0.8888888888888888,True,87.704572 +868da0d2-e226-4448-acb9-168cabbf341d,zai-org/GLM-4.5-Air-FP8,together_ai,merge-diff-arc-agi-task,13386,4920,18306,231.623286,False,0.0,zai-org/GLM-4.5-Air-FP8,merge-diff-arc-agi-task,231.623286,False,0.0,False,231.623286 +d65c207d-655b-4b0b-a5db-bc54a871abc4,gpt-5,openai,dna-assembly,14353,13245,27598,720.031722,False,0.0,gpt-5,dna-assembly,720.031722,False,0.0,False,720.031722 
+0e5c2e18-c22e-49ce-8da9-b452f91ab55e,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,mteb-retrieve,2323,1262,3585,189.050685,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,mteb-retrieve,189.050685,False,0.0,False,189.050685 +13de0ee6-dd4d-4fb9-b751-6d1e7955403e,zai-org/GLM-4.5-Air-FP8,together_ai,make-mips-interpreter,37488,29319,66807,1323.677248,False,0.0,zai-org/GLM-4.5-Air-FP8,make-mips-interpreter,1323.677248,False,0.0,False,1323.677248 +6e7bf554-2aac-4171-80ae-c1a60f52c095,openai/gpt-oss-120b,together_ai,polyglot-c-py,916,1240,2156,178.844767,False,0.0,openai/gpt-oss-120b,polyglot-c-py,178.844767,False,0.0,False,178.844767 +bd049ae5-a453-44cf-9d94-ff498d27a67a,openai/gpt-oss-120b,together_ai,model-extraction-relu-logits,1664,683,2347,76.035923,False,0.0,openai/gpt-oss-120b,model-extraction-relu-logits,76.035923,False,0.0,False,76.035923 +255fb8f0-e178-47af-8b10-220b12f925d3,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-initramfs-qemu,1350,943,2293,59.102325,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-initramfs-qemu,59.102325,False,0.0,False,59.102325 +cd9a98f2-458b-485b-b83b-91fab1989bc3,openai/gpt-oss-120b,together_ai,sqlite-with-gcov,1149,829,1978,241.021303,True,1.0,openai/gpt-oss-120b,sqlite-with-gcov,241.021303,True,0.8,True,241.021303 +d78235e2-f26c-426e-8a05-31ff921c5021,claude-opus-4-1-20250805,anthropic,mteb-leaderboard,1708,1495,3203,116.844017,False,0.0,claude-opus-4-1-20250805,mteb-leaderboard,116.844017,False,0.0,False,116.844017 +cfff69ab-a6f0-481d-9b87-b97201fe2019,claude-opus-4-1-20250805,anthropic,qemu-startup,2010,1421,3431,963.542424,False,0.0,claude-opus-4-1-20250805,qemu-startup,963.542424,False,0.4285714285714285,False,963.542424 +dbf4a7b2-52ab-4ef6-8f54-b82966dd3bc8,claude-sonnet-4-20250514,anthropic,bn-fit-modify,15398,8716,24114,2270.286565,False,0.0,claude-sonnet-4-20250514,bn-fit-modify,2270.286565,False,0.8,False,2270.286565 
+e3847b5a-5852-4d7b-9afa-1284763c6f05,zai-org/GLM-4.5-Air-FP8,together_ai,video-processing,2853,2555,5408,161.489294,False,0.0,zai-org/GLM-4.5-Air-FP8,video-processing,161.489294,False,0.0,False,161.489294 +e33a5b98-49ca-4c9e-a02c-48a3a278d976,claude-opus-4-1-20250805,anthropic,filter-js-from-html,20999,19222,40221,909.1637,False,0.0,claude-opus-4-1-20250805,filter-js-from-html,909.1637,False,0.0,False,909.1637 +674ca55c-5d16-41e2-8feb-00222cb89955,claude-opus-4-1-20250805,anthropic,polyglot-rust-c,17291,15865,33156,914.193253,False,0.0,claude-opus-4-1-20250805,polyglot-rust-c,914.193253,False,0.0,False,914.193253 +58b0e2fb-6981-476a-8664-4ae1db2569d2,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-pmars,20988,7739,28727,565.936369,True,1.0,moonshotai/Kimi-K2-Instruct-0905,build-pmars,565.936369,True,0.8,True,565.936369 +274d8dd5-1bcf-4e85-9a23-e960479a9d73,gpt-5,openai,path-tracing,16305,16089,32394,1802.085791,False,0.0,gpt-5,path-tracing,1802.085791,False,0.0,False,1802.085791 +fcd53fec-4fb7-486a-827b-719e3f5ce8cc,deepseek-ai/DeepSeek-V3.1,together_ai,install-windows-3.11,16766,9594,26360,960.011897,False,0.0,deepseek-ai/DeepSeek-V3.1,install-windows-3.11,960.011897,False,0.0,False,960.011897 +e315bb79-60bf-451f-a47d-0622529a8ac6,gpt-5,openai,circuit-fibsqrt,19086,35166,54252,2780.124129,True,1.0,gpt-5,circuit-fibsqrt,2780.124129,True,0.6666666666666666,True,2780.124129 +534db045-118e-4154-aab6-503de0e6d2c2,openai/gpt-oss-120b,together_ai,schemelike-metacircular-eval,6670,3291,9961,277.201498,False,0.0,openai/gpt-oss-120b,schemelike-metacircular-eval,277.201498,False,0.0,False,277.201498 +68cdc892-e64f-4900-a868-cd1783c29052,OpenAI/gpt-oss-20B,together_ai,pytorch-model-recovery,2235,7033,9268,909.177927,False,0.0,OpenAI/gpt-oss-20B,pytorch-model-recovery,909.177927,False,0.0,False,909.177927 
+d9dafa1c-e162-4448-a732-d1ef9696edf0,gpt-5-mini,openai,build-cython-ext,9283,7096,16379,900.469947,False,0.0,gpt-5-mini,build-cython-ext,900.469947,False,0.2,False,900.469947 +82b5839d-886d-40b5-a852-1653cdec6b06,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,tune-mjcf,11744,12119,23863,900.150001,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,tune-mjcf,900.150001,False,0.0,False,900.150001 +e9a59387-1fcd-434b-bf47-ee3835be3fd8,OpenAI/gpt-oss-20B,together_ai,build-initramfs-qemu,1242,2004,3246,47.463443,False,0.0,OpenAI/gpt-oss-20B,build-initramfs-qemu,47.463443,False,0.0,False,47.463443 +43e5e073-eb9c-4642-ab77-b78613892852,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,password-recovery,2337,2473,4810,187.252973,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,password-recovery,187.252973,False,0.0,False,187.252973 +8c817bdf-e271-409e-ac30-a0178c7455bb,claude-sonnet-4-20250514,anthropic,feal-differential-cryptanalysis,21608,19260,40868,1386.949371,False,0.0,claude-sonnet-4-20250514,feal-differential-cryptanalysis,1386.949371,False,0.0,False,1386.949371 +d2cb35a7-181d-4335-bc70-a9906dde9e7d,grok-code-fast-1,xai,build-cython-ext,7787,2937,10724,908.508152,False,0.0,grok-code-fast-1,build-cython-ext,908.508152,False,0.0,False,908.508152 +9a90c6c3-aa44-41d3-80a0-dfd2f4b3d7d4,zai-org/GLM-4.5-Air-FP8,together_ai,make-doom-for-mips,16639,3822,20461,904.808309,False,0.0,zai-org/GLM-4.5-Air-FP8,make-doom-for-mips,904.808309,False,0.0,False,904.808309 +9dd17647-8349-464f-b183-4d543bfb4e7a,deepseek-ai/DeepSeek-V3.1,together_ai,dna-insert,7609,3737,11346,631.8803,False,0.0,deepseek-ai/DeepSeek-V3.1,dna-insert,631.8803,False,0.0,False,631.8803 +9b7621f6-5cda-4e2b-bfdb-27719499abc8,zai-org/GLM-4.5-Air-FP8,together_ai,fix-git,4008,2597,6605,241.068161,True,1.0,zai-org/GLM-4.5-Air-FP8,fix-git,241.068161,True,0.6,True,241.068161 
+9487c006-b3f3-46f5-aa58-db961dd0798e,moonshotai/Kimi-K2-Instruct-0905,together_ai,hf-model-inference,4684,2598,7282,918.51472,False,0.0,moonshotai/Kimi-K2-Instruct-0905,hf-model-inference,918.51472,False,0.0,False,918.51472 +f0d343fb-6ea9-4a4a-a397-21ae4bfdc84c,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,financial-document-processor,9152,2096,11248,87.426206,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,financial-document-processor,87.426206,False,0.0,False,87.426206 +72afd092-4dc5-49fa-b4df-e19476df99db,claude-sonnet-4-20250514,anthropic,video-processing,7895,6236,14131,505.344073,False,0.0,claude-sonnet-4-20250514,video-processing,505.344073,False,0.0,False,505.344073 +55130153-64f3-4944-b1d7-811b02dbb23f,grok-4-0709,xai,bn-fit-modify,13677,5702,19379,1829.417233,True,1.0,grok-4-0709,bn-fit-modify,1829.417233,True,0.6,True,1829.417233 +e65cb80e-d306-4c06-bd34-3cebb703917a,gpt-5-mini,openai,cobol-modernization,5439,3918,9357,494.87513,True,1.0,gpt-5-mini,cobol-modernization,494.87513,True,1.0,True,494.87513 +31092841-cbf3-4b2a-9d67-b83c6529933b,gemini-2.5-flash,gemini,fix-code-vulnerability,4675,3177,7852,949.079368,False,0.0,gemini-2.5-flash,fix-code-vulnerability,949.079368,False,0.0,False,949.079368 +4754ee4b-a5b3-47a4-a6c6-1dda46b46f68,gpt-5-mini,openai,polyglot-rust-c,8324,5572,13896,901.168655,False,0.0,gpt-5-mini,polyglot-rust-c,901.168655,False,0.0,False,901.168655 +a1a72053-dd64-4a8d-a0b9-183457c38182,gpt-5,openai,dna-insert,961,4301,5262,380.107128,False,0.0,gpt-5,dna-insert,380.107128,False,0.0,False,380.107128 +59e6fd84-ac60-4260-b93e-6425f778a558,gpt-5,openai,make-doom-for-mips,10602,5616,16218,900.659976,False,0.0,gpt-5,make-doom-for-mips,900.659976,False,0.0,False,900.659976 +9c6e739d-7605-45bb-b01d-ee01a4df663f,OpenAI/gpt-oss-20B,together_ai,polyglot-c-py,214,957,1171,87.36403,False,0.0,OpenAI/gpt-oss-20B,polyglot-c-py,87.36403,False,0.0,False,87.36403 
+b3fe8586-e0be-4bbd-8c17-ebb4a4e957fb,deepseek-ai/DeepSeek-V3.1,together_ai,feal-linear-cryptanalysis,32211,28535,60746,1808.088625,False,0.0,deepseek-ai/DeepSeek-V3.1,feal-linear-cryptanalysis,1808.088625,False,0.0,False,1808.088625 +397aac9a-b375-4a5e-83ad-2d4fbb006123,gpt-5-nano,openai,run-pdp11-code,6972,6527,13499,1000.023488,False,0.0,gpt-5-nano,run-pdp11-code,1000.023488,False,0.0,False,1000.023488 +eebed711-648d-4af0-b7f9-96286ddd4442,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,cancel-async-tasks,2408,1840,4248,241.723907,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,cancel-async-tasks,241.723907,True,0.6,True,241.723907 +3ab4d380-e5db-4593-8bb0-3fe373d180a2,zai-org/GLM-4.5-Air-FP8,together_ai,torch-tensor-parallelism,1892,1632,3524,26.359132,False,0.0,zai-org/GLM-4.5-Air-FP8,torch-tensor-parallelism,26.359132,False,0.0,False,26.359132 +e32f9fe1-5b8a-45be-9a7b-03e466bfe776,claude-opus-4-1-20250805,anthropic,log-summary-date-ranges,7878,1885,9763,138.376435,True,1.0,claude-opus-4-1-20250805,log-summary-date-ranges,138.376435,True,0.8888888888888888,True,138.376435 +7f0add51-8baf-4af7-b687-d4a6ae1de47f,grok-4-0709,xai,reshard-c4-data,2378,631,3009,909.682071,False,0.0,grok-4-0709,reshard-c4-data,909.682071,False,0.0,False,909.682071 +60ee2b95-9ee2-489a-b2ea-828a924a1dba,gpt-5-nano,openai,build-pmars,8398,6145,14543,910.247932,False,0.0,gpt-5-nano,build-pmars,910.247932,False,0.0,False,910.247932 +d8c24f23-a54d-4ab0-9f4e-3def8991fd93,OpenAI/gpt-oss-20B,together_ai,pytorch-model-cli,518,755,1273,27.416625,False,0.0,OpenAI/gpt-oss-20B,pytorch-model-cli,27.416625,False,0.0,False,27.416625 +d0dae0b3-3724-4764-a61c-8c7dbf72d512,gemini-2.5-pro,gemini,winning-avg-corewars,11535,15915,27450,3606.094026,False,0.0,gemini-2.5-pro,winning-avg-corewars,3606.094026,False,0.0,False,3606.094026 
+5d466124-a81f-41bd-a4c3-9fa7cd305594,gpt-5,openai,schemelike-metacircular-eval,6587,6873,13460,2402.016763,False,0.0,gpt-5,schemelike-metacircular-eval,2402.016763,False,0.0,False,2402.016763 +ea6014af-ac3f-4ead-8747-bc79e988f823,OpenAI/gpt-oss-20B,together_ai,fix-ocaml-gc,13372,65037,78409,3600.737771,False,0.0,OpenAI/gpt-oss-20B,fix-ocaml-gc,3600.737771,False,0.0,False,3600.737771 +ef7bc6f1-4814-46de-a337-abe419867f9a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sparql-university,2696,1211,3907,595.921087,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sparql-university,595.921087,False,0.0,False,595.921087 +71183fc6-dbc9-46fb-8701-f0cc89b75a0e,moonshotai/Kimi-K2-Instruct-0905,together_ai,qemu-alpine-ssh,3823,7345,11168,900.26263,False,0.0,moonshotai/Kimi-K2-Instruct-0905,qemu-alpine-ssh,900.26263,False,0.0,False,900.26263 +f1899341-b1ba-4c56-b669-3b3a8450598f,gpt-5,openai,nginx-request-logging,3877,1428,5305,148.27305,True,1.0,gpt-5,nginx-request-logging,148.27305,True,1.0,True,148.27305 +5cf8df3c-1403-4ada-bc71-535d42b2fd24,grok-code-fast-1,xai,reshard-c4-data,2786,3111,5897,426.803332,False,0.0,grok-code-fast-1,reshard-c4-data,426.803332,False,0.0,False,426.803332 +9384f5b8-214c-427b-990b-de9cfce76bdb,moonshotai/Kimi-K2-Instruct-0905,together_ai,winning-avg-corewars,10622,10195,20817,836.514908,False,0.0,moonshotai/Kimi-K2-Instruct-0905,winning-avg-corewars,836.514908,False,0.0,False,836.514908 +e6161e63-53b9-41ee-872e-8441a6aa0f60,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,largest-eigenval,4650,3804,8454,913.102286,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,largest-eigenval,913.102286,False,0.2,False,913.102286 +7610a108-98fa-4b7b-9d03-415b142978eb,claude-opus-4-1-20250805,anthropic,video-processing,4070,3008,7078,96.72613,False,0.0,claude-opus-4-1-20250805,video-processing,96.72613,False,0.0,False,96.72613 
+612f0235-3d20-4445-8049-029a38755416,zai-org/GLM-4.5-Air-FP8,together_ai,sanitize-git-repo,7833,5361,13194,278.406908,False,0.0,zai-org/GLM-4.5-Air-FP8,sanitize-git-repo,278.406908,False,0.0,False,278.406908 +f7e2dd74-15c0-40fb-9086-cb62e62c85e8,gemini-2.5-pro,gemini,qemu-alpine-ssh,1885,1693,3578,337.163325,False,0.0,gemini-2.5-pro,qemu-alpine-ssh,337.163325,False,0.2,False,337.163325 +44aa0c21-5e5f-4a62-a476-40c8430acb51,openai/gpt-oss-120b,together_ai,vulnerable-secret,12795,5955,18750,303.773106,False,0.0,openai/gpt-oss-120b,vulnerable-secret,303.773106,False,0.0,False,303.773106 +c780b22d-8449-4cdc-a780-497bb698fcdd,gpt-5-nano,openai,hf-model-inference,17417,10256,27673,908.559964,True,1.0,gpt-5-nano,hf-model-inference,908.559964,True,0.4,True,908.559964 +ebdf4de3-4492-47ad-9d54-6035269558e4,deepseek-ai/DeepSeek-V3.1,together_ai,path-tracing-reverse,30129,18994,49123,1435.217047,True,1.0,deepseek-ai/DeepSeek-V3.1,path-tracing-reverse,1435.217047,True,0.2,True,1435.217047 +5b39977e-c4a3-4cdb-9e7c-878dcab0d1a5,claude-opus-4-1-20250805,anthropic,fix-code-vulnerability,7923,3922,11845,952.519263,False,0.0,claude-opus-4-1-20250805,fix-code-vulnerability,952.519263,False,0.125,False,952.519263 +1b77a840-a6f8-4e67-a279-8cf7823604c1,gemini-2.5-pro,gemini,build-pmars,13762,5073,18835,454.624491,True,1.0,gemini-2.5-pro,build-pmars,454.624491,True,1.0,True,454.624491 +6c6eef6f-67ac-400d-a0af-a2241eb9b183,grok-4-0709,xai,dna-insert,4693,506,5199,387.284604,False,0.0,grok-4-0709,dna-insert,387.284604,False,0.0,False,387.284604 +95d942a2-62c2-44d1-b4da-0453f0154f5d,gemini-2.5-pro,gemini,log-summary-date-ranges,7364,2060,9424,392.271661,False,0.0,gemini-2.5-pro,log-summary-date-ranges,392.271661,False,0.0,False,392.271661 +eb745a21-d8b6-41f7-a97f-dccb3248c928,claude-sonnet-4-20250514,anthropic,sparql-university,7328,2548,9876,382.729176,False,0.0,claude-sonnet-4-20250514,sparql-university,382.729176,False,0.0,False,382.729176 
+382de16c-b539-434b-83c0-a43a4e354b0b,moonshotai/Kimi-K2-Instruct-0905,together_ai,schemelike-metacircular-eval,27013,26934,53947,2435.919489,False,0.0,moonshotai/Kimi-K2-Instruct-0905,schemelike-metacircular-eval,2435.919489,False,0.0,False,2435.919489 +4281cf11-3c02-4696-b476-ae86a49c05b4,claude-opus-4-1-20250805,anthropic,video-processing,4024,3361,7385,337.285543,False,0.0,claude-opus-4-1-20250805,video-processing,337.285543,False,0.0,False,337.285543 +be95abe5-2741-4e76-9a18-923ab1ee9a25,gpt-5-mini,openai,prove-plus-comm,1479,910,2389,93.581642,True,1.0,gpt-5-mini,prove-plus-comm,93.581642,True,0.6,True,93.581642 +ba0b2cd9-beb9-4194-bd78-8d28ceba0bcc,moonshotai/Kimi-K2-Instruct-0905,together_ai,reverse-engineering,11770,12272,24042,1800.048259,False,0.0,moonshotai/Kimi-K2-Instruct-0905,reverse-engineering,1800.048259,False,0.2,False,1800.048259 +038cc009-23e9-4b09-931b-ee8d35985188,gemini-2.5-flash,gemini,mteb-retrieve,1951,879,2830,92.911694,False,0.0,gemini-2.5-flash,mteb-retrieve,92.911694,False,0.0,False,92.911694 +b8be46a6-ad64-44e1-93a4-f530eb59e722,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,feal-differential-cryptanalysis,29385,29834,59219,1560.852697,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,feal-differential-cryptanalysis,1560.852697,False,0.0,False,1560.852697 +a73ec9f9-2613-4db3-9a4b-ea2e4d0a271c,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,write-compressor,1708,3268,4976,1205.02096,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,write-compressor,1205.02096,False,0.0,False,1205.02096 +be3618de-a0c0-4a68-b4e9-0a4309c9e10b,gemini-2.5-flash,gemini,build-initramfs-qemu,5987,2405,8392,136.46695,False,0.0,gemini-2.5-flash,build-initramfs-qemu,136.46695,False,0.0,False,136.46695 +9abfad31-2161-46bb-9453-2d7059b2f9fd,gpt-5,openai,filter-js-from-html,2385,1850,4235,513.369315,False,0.0,gpt-5,filter-js-from-html,513.369315,False,0.0,False,513.369315 
+a5a65fa5-09d4-4e7d-8b68-f04aeec0e0e1,gpt-5-mini,openai,bn-fit-modify,9965,9544,19509,516.950439,False,0.0,gpt-5-mini,bn-fit-modify,516.950439,False,0.6,False,516.950439 +502f9f71-6539-468d-9d85-4d8825075884,gpt-5,openai,build-pov-ray,15482,5966,21448,693.824771,False,0.0,gpt-5,build-pov-ray,693.824771,False,0.0,False,693.824771 +7c278c4a-89d3-4b06-a594-1a7903cd80f8,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,fix-git,1854,1370,3224,73.546742,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,fix-git,73.546742,False,0.0,False,73.546742 +6c2e55cf-3b8b-436a-bd66-ecb3ae6e3b74,deepseek-ai/DeepSeek-V3.1,together_ai,regex-log,3143,2660,5803,159.102717,False,0.0,deepseek-ai/DeepSeek-V3.1,regex-log,159.102717,False,0.2,False,159.102717 +b7dfa100-d590-4f89-930e-60354663b18b,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,fix-ocaml-gc,100607,22677,123284,3602.62982,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,fix-ocaml-gc,3602.62982,False,0.0,False,3602.62982 +d950ea69-fb26-4f9d-952e-438aaad28903,gpt-5-nano,openai,pytorch-model-cli,1993,1705,3698,228.27177,False,0.0,gpt-5-nano,pytorch-model-cli,228.27177,False,0.0,False,228.27177 +1d609737-7f44-4c78-8e59-e10c2ddde87f,gpt-5,openai,build-cython-ext,6983,4986,11969,911.364356,False,0.0,gpt-5,build-cython-ext,911.364356,False,0.0,False,911.364356 +79c59929-1b11-4122-b5ea-d3564eba9bfa,gpt-5,openai,filter-js-from-html,2829,1660,4489,190.504802,False,0.0,gpt-5,filter-js-from-html,190.504802,False,0.0,False,190.504802 +f3209a38-095f-4b2a-af15-d86fc4264d5f,gpt-5,openai,schemelike-metacircular-eval,38885,54978,93863,2400.007932,False,0.0,gpt-5,schemelike-metacircular-eval,2400.007932,False,0.0,False,2400.007932 +117e281a-7f97-4c9a-bd8c-575d07d72161,openai/gpt-oss-120b,together_ai,break-filter-js-from-html,1596,881,2477,115.633334,False,0.0,openai/gpt-oss-120b,break-filter-js-from-html,115.633334,False,0.0,False,115.633334 
+00bc7790-2d01-4841-bab5-43d50d17197c,zai-org/GLM-4.5-Air-FP8,together_ai,polyglot-rust-c,1652,4232,5884,94.30796,False,0.0,zai-org/GLM-4.5-Air-FP8,polyglot-rust-c,94.30796,False,0.0,False,94.30796 +7aa9233a-eb99-4bc1-b8fd-f0ceeef3c326,claude-opus-4-1-20250805,anthropic,gpt2-codegolf,27235,26878,54113,900.002203,False,0.0,claude-opus-4-1-20250805,gpt2-codegolf,900.002203,False,0.0,False,900.002203 +bc26752e-5bdf-4bd7-bf2b-52cd3235f7a7,gpt-5-nano,openai,build-pov-ray,2778,3569,6347,349.746264,False,0.0,gpt-5-nano,build-pov-ray,349.746264,False,0.0,False,349.746264 +bf5c4722-0681-4a25-9e99-117934b010eb,gpt-5-nano,openai,mteb-leaderboard,14381,19099,33480,1937.702894,False,0.0,gpt-5-nano,mteb-leaderboard,1937.702894,False,0.0,False,1937.702894 +0ec75d07-c134-446a-bb5f-3f5c4422bce9,grok-code-fast-1,xai,schemelike-metacircular-eval,4016,3194,7210,81.237479,False,0.0,grok-code-fast-1,schemelike-metacircular-eval,81.237479,False,0.0,False,81.237479 +f035797c-385c-4a15-a365-1927717a372c,claude-opus-4-1-20250805,anthropic,make-doom-for-mips,25747,12571,38318,900.003115,False,0.0,claude-opus-4-1-20250805,make-doom-for-mips,900.003115,False,0.0,False,900.003115 +d8e1bb84-c799-4a3c-82a5-7df1b83bcf42,claude-sonnet-4-20250514,anthropic,hf-model-inference,6166,3907,10073,528.661928,False,0.0,claude-sonnet-4-20250514,hf-model-inference,528.661928,False,0.2,False,528.661928 +5001f33a-d49b-4725-b868-40a3a9f0088a,grok-4-0709,xai,pytorch-model-recovery,5125,5006,10131,903.527938,False,0.0,grok-4-0709,pytorch-model-recovery,903.527938,False,0.2,False,903.527938 +40dc62c4-302d-49ff-aaa6-027d78becd3c,OpenAI/gpt-oss-20B,together_ai,wasm-pipeline,223,1028,1251,922.103355,False,0.0,OpenAI/gpt-oss-20B,wasm-pipeline,922.103355,False,0.0,False,922.103355 +ab15ff57-828d-4ab1-8752-34bd1c0d9c90,gpt-5,openai,train-fasttext,15316,8688,24004,3600.5908,False,0.0,gpt-5,train-fasttext,3600.5908,False,0.0,False,3600.5908 
+498aeac8-5ec1-4bf3-84d1-49ea13ff1c24,gpt-5-nano,openai,cobol-modernization,15362,19656,35018,906.29711,False,0.0,gpt-5-nano,cobol-modernization,906.29711,False,0.4,False,906.29711 +ee448201-b409-4db9-b531-7e4362d0bcfc,grok-code-fast-1,xai,path-tracing,2974,2984,5958,468.402407,False,0.0,grok-code-fast-1,path-tracing,468.402407,False,0.0,False,468.402407 +dc9909e3-9db6-46cf-b626-5a8a02d86427,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,constraints-scheduling,16021,15737,31758,1204.966363,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,constraints-scheduling,1204.966363,True,1.0,True,1204.966363 +55446577-2f3e-4f12-81f9-62ba0335484a,moonshotai/Kimi-K2-Instruct-0905,together_ai,fix-ocaml-gc,45941,18355,64296,2191.174596,False,0.0,moonshotai/Kimi-K2-Instruct-0905,fix-ocaml-gc,2191.174596,False,0.0,False,2191.174596 +9efc1715-dc10-43ab-894c-5760b5bc96f2,gpt-5-mini,openai,log-summary-date-ranges,5522,1306,6828,115.511487,False,0.0,gpt-5-mini,log-summary-date-ranges,115.511487,False,0.0,False,115.511487 +13a8e061-4a0f-4183-95fb-28fc4783fc64,claude-opus-4-1-20250805,anthropic,winning-avg-corewars,71410,73746,145156,3600.003512,False,0.0,claude-opus-4-1-20250805,winning-avg-corewars,3600.003512,False,0.3333333333333333,False,3600.003512 +d79fa122-ecd8-46d8-993a-066b8fe48c5d,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,port-compressor,111423,60551,171974,3600.012846,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,port-compressor,3600.012846,False,0.0,False,3600.012846 +be45e906-45c3-4604-b38f-dd3ff98216a7,grok-4-0709,xai,chess-best-move,13818,3048,16866,903.856588,False,0.0,grok-4-0709,chess-best-move,903.856588,False,0.0,False,903.856588 +371272f2-e40d-41da-a6cf-a42b7a406413,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,log-summary-date-ranges,4188,1685,5873,103.066969,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,log-summary-date-ranges,103.066969,False,0.0,False,103.066969 
+94289b2a-8326-4d30-a761-a6322b7c715d,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,torch-tensor-parallelism,4588,2629,7217,246.88208,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,torch-tensor-parallelism,246.88208,False,0.0,False,246.88208 +ced8e5ff-93dc-482e-91fd-7fefe669c916,gpt-5,openai,sqlite-db-truncate,7778,6943,14721,426.899398,False,0.0,gpt-5,sqlite-db-truncate,426.899398,False,0.0,False,426.899398 +9e7e6013-d316-401d-9db8-4ee78c7f2caf,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,torch-tensor-parallelism,1567,728,2295,52.583436,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,torch-tensor-parallelism,52.583436,False,0.0,False,52.583436 +62a09aec-f472-43a2-81ae-a6162b9a55de,gpt-5,openai,write-compressor,797,609,1406,900.527563,False,0.0,gpt-5,write-compressor,900.527563,False,0.3333333333333333,False,900.527563 +805ae946-1ad2-49ee-947f-3beb0cc852ea,moonshotai/Kimi-K2-Instruct-0905,together_ai,adaptive-rejection-sampler,11078,9388,20466,909.112255,False,0.0,moonshotai/Kimi-K2-Instruct-0905,adaptive-rejection-sampler,909.112255,False,0.0,False,909.112255 +ffa9d467-0c7f-459c-9325-00e41e45acca,gpt-5-mini,openai,mteb-retrieve,2679,1877,4556,196.847309,False,0.0,gpt-5-mini,mteb-retrieve,196.847309,False,0.0,False,196.847309 +f83aa081-4b9c-47a3-98c4-3a51c2e0ab1c,gpt-5,openai,prove-plus-comm,1822,1273,3095,205.355998,True,1.0,gpt-5,prove-plus-comm,205.355998,True,0.8571428571428571,True,205.355998 +7ded1b3b-dd51-472e-9233-1a5f6557ad7c,grok-4-0709,xai,nginx-request-logging,3767,1489,5256,353.170968,True,1.0,grok-4-0709,nginx-request-logging,353.170968,True,1.0,True,353.170968 +b46001ea-ae53-41e0-a41a-0a0f78529981,gpt-5-mini,openai,db-wal-recovery,1994,2318,4312,171.910375,False,0.0,gpt-5-mini,db-wal-recovery,171.910375,False,0.0,False,171.910375 +1af73754-908d-48a5-8f4d-670dad2c377b,gpt-5-nano,openai,crack-7z-hash,1899,1000,2899,68.582114,False,0.0,gpt-5-nano,crack-7z-hash,68.582114,False,0.0,False,68.582114 
+826c11b1-3bf1-44e8-8e86-c44d87d8f23e,gpt-5-nano,openai,cancel-async-tasks,29694,38537,68231,1802.185056,False,0.0,gpt-5-nano,cancel-async-tasks,1802.185056,False,0.4,False,1802.185056 +868b95de-384a-49f1-bd00-8bff2712c038,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,write-compressor,2715,930,3645,1416.734966,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,write-compressor,1416.734966,False,0.0,False,1416.734966 +98a1727a-fad1-4d7e-8d7f-ed570888d97a,gpt-5,openai,cobol-modernization,4369,5006,9375,904.580499,True,1.0,gpt-5,cobol-modernization,904.580499,True,1.0,True,904.580499 +5f4402b0-4241-49e1-8b78-38a99fe8b5dd,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,form-filling,9057,7330,16387,901.912502,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,form-filling,901.912502,True,0.8,True,901.912502 +8dd05b49-b4e4-4652-87dd-207dc51d5387,claude-sonnet-4-20250514,anthropic,regex-log,3054,2041,5095,128.273127,False,0.0,claude-sonnet-4-20250514,regex-log,128.273127,False,0.8,False,128.273127 +53ef0924-cdc3-428e-803a-61a001840766,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,train-fasttext,14855,5557,20412,2193.987261,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,train-fasttext,2193.987261,False,0.0,False,2193.987261 +45527d41-9601-46e0-b195-1fa35851a8c1,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-pmars,17848,5258,23106,514.548414,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-pmars,514.548414,True,1.0,True,514.548414 +c4ff7377-67a7-4fb4-b2c9-5710a2048d31,grok-code-fast-1,xai,mteb-leaderboard,6496,2260,8756,368.17852,False,0.0,grok-code-fast-1,mteb-leaderboard,368.17852,False,0.0,False,368.17852 +fcd0f26c-31f1-451b-b757-7eb196284dd6,claude-opus-4-1-20250805,anthropic,wasm-pipeline,11512,4066,15578,238.562136,True,1.0,claude-opus-4-1-20250805,wasm-pipeline,238.562136,True,0.1428571428571428,True,238.562136 
+08c2bd66-3b62-478d-9200-d64e4733a219,openai/gpt-oss-120b,together_ai,cobol-modernization,5547,3337,8884,200.779358,True,1.0,openai/gpt-oss-120b,cobol-modernization,200.779358,True,0.8,True,200.779358 +3d875769-e80b-4552-8b32-ad26630e8cb0,gpt-5,openai,install-klee-minimal,1766,1944,3710,900.057718,False,0.0,gpt-5,install-klee-minimal,900.057718,False,0.0,False,900.057718 +c8c48058-b27c-449a-974e-ea78273028a5,gpt-5-mini,openai,port-compressor,21095,21958,43053,3607.063215,False,0.0,gpt-5-mini,port-compressor,3607.063215,False,0.0,False,3607.063215 +559b97d7-851a-49d4-808b-5b4fa4a20bfa,zai-org/GLM-4.5-Air-FP8,together_ai,video-processing,3409,2537,5946,234.021947,False,0.0,zai-org/GLM-4.5-Air-FP8,video-processing,234.021947,False,0.0,False,234.021947 +51f929c3-0647-4c4d-b3b4-b301cc62a0b1,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,install-windows-3.11,8795,4497,13292,919.509702,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,install-windows-3.11,919.509702,False,0.0,False,919.509702 +319f5b4a-1bdf-4402-8e19-2fdf06557625,moonshotai/Kimi-K2-Instruct-0905,together_ai,gpt2-codegolf,9919,10372,20291,662.719464,False,0.0,moonshotai/Kimi-K2-Instruct-0905,gpt2-codegolf,662.719464,False,0.0,False,662.719464 +ddee4f23-9621-449a-ae45-e4b4b8d12da6,claude-sonnet-4-20250514,anthropic,qemu-startup,5031,7894,12925,903.382758,False,0.0,claude-sonnet-4-20250514,qemu-startup,903.382758,False,0.4,False,903.382758 +71b22a5b-0aca-4179-b08d-e6f251152f28,moonshotai/Kimi-K2-Instruct-0905,together_ai,qemu-alpine-ssh,2001,2805,4806,238.972082,False,0.0,moonshotai/Kimi-K2-Instruct-0905,qemu-alpine-ssh,238.972082,False,0.0,False,238.972082 +666c604c-9a58-454d-9f70-fafdaa8233bc,gpt-5-mini,openai,model-extraction-relu-logits,2065,1699,3764,431.490574,False,0.0,gpt-5-mini,model-extraction-relu-logits,431.490574,False,0.0,False,431.490574 
+01e1fd5d-74d3-4bb1-bab1-960864d0b1f9,zai-org/GLM-4.5-Air-FP8,together_ai,code-from-image,16666,16779,33445,844.295601,False,0.0,zai-org/GLM-4.5-Air-FP8,code-from-image,844.295601,False,0.2,False,844.295601 +a520c6b7-3bab-40ca-9113-e1bbef7cff5e,grok-code-fast-1,xai,sqlite-db-truncate,2057,1403,3460,237.207365,False,0.0,grok-code-fast-1,sqlite-db-truncate,237.207365,False,0.0,False,237.207365 +77d7cbae-288b-4ea7-9d0b-df6f4b4279b9,grok-code-fast-1,xai,bn-fit-modify,5345,4002,9347,369.947591,False,0.0,grok-code-fast-1,bn-fit-modify,369.947591,False,0.0,False,369.947591 +6447806c-dc8d-45e7-b25a-96d83e545f11,openai/gpt-oss-120b,together_ai,crack-7z-hash,8055,3602,11657,220.401171,False,0.0,openai/gpt-oss-120b,crack-7z-hash,220.401171,False,0.0,False,220.401171 +617ec320-3bc9-445e-89b1-015a3f635150,grok-4-0709,xai,sqlite-db-truncate,1664,1308,2972,314.616573,False,0.0,grok-4-0709,sqlite-db-truncate,314.616573,False,0.0,False,314.616573 +c433bb70-3d29-4517-92c6-3e8ba4f64b8b,deepseek-ai/DeepSeek-V3.1,together_ai,build-pmars,11208,2734,13942,345.27496,True,1.0,deepseek-ai/DeepSeek-V3.1,build-pmars,345.27496,True,1.0,True,345.27496 +0d643e75-f492-44a8-92b3-10cd14ea0adb,deepseek-ai/DeepSeek-V3.1,together_ai,filter-js-from-html,3097,5315,8412,789.684955,False,0.0,deepseek-ai/DeepSeek-V3.1,filter-js-from-html,789.684955,False,0.0,False,789.684955 +67b351a2-e03e-4e78-afc5-d5467aaf9250,gpt-5,openai,qemu-startup,1467,811,2278,228.781141,True,1.0,gpt-5,qemu-startup,228.781141,True,0.8,True,228.781141 +1be98eea-b9ea-4d38-a068-9d93efe202f7,zai-org/GLM-4.5-Air-FP8,together_ai,db-wal-recovery,3555,4979,8534,321.451714,False,0.0,zai-org/GLM-4.5-Air-FP8,db-wal-recovery,321.451714,False,0.0,False,321.451714 +21a9659f-de06-42f2-9d1d-82b0b91f417e,OpenAI/gpt-oss-20B,together_ai,extract-elf,4909,13385,18294,902.545987,False,0.0,OpenAI/gpt-oss-20B,extract-elf,902.545987,False,0.2,False,902.545987 
+9ea2f631-50b2-41fc-becb-fc67a783caf8,claude-sonnet-4-20250514,anthropic,build-pov-ray,21644,10130,31774,1275.507878,True,1.0,claude-sonnet-4-20250514,build-pov-ray,1275.507878,True,0.6,True,1275.507878 +987274e9-3af2-4985-a9ab-caed1fafbf2f,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,reshard-c4-data,11371,8681,20052,902.722468,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,reshard-c4-data,902.722468,False,0.0,False,902.722468 +73817b8e-be63-4f2b-8f38-fae064fee451,gpt-5-nano,openai,distribution-search,27005,45690,72695,3623.688132,False,0.0,gpt-5-nano,distribution-search,3623.688132,False,0.25,False,3623.688132 +8a802119-742c-4c1c-aa94-e684193f40ee,grok-code-fast-1,xai,count-dataset-tokens,7103,1856,8959,935.432369,False,0.0,grok-code-fast-1,count-dataset-tokens,935.432369,False,0.0,False,935.432369 +a0b5aa9d-3733-451d-ab04-0faae65c02b4,deepseek-ai/DeepSeek-V3.1,together_ai,fix-git,7034,2529,9563,1711.423649,False,0.0,deepseek-ai/DeepSeek-V3.1,fix-git,1711.423649,False,0.8,False,1711.423649 +3c51cb50-3450-4ca4-bcb2-38581be30242,moonshotai/Kimi-K2-Instruct-0905,together_ai,dna-assembly,16096,12314,28410,738.702978,False,0.0,moonshotai/Kimi-K2-Instruct-0905,dna-assembly,738.702978,False,0.0,False,738.702978 +c8fe452a-3a6a-45ee-a35f-df55603648f5,gpt-5,openai,make-mips-interpreter,8920,30797,39717,1801.337443,False,0.0,gpt-5,make-mips-interpreter,1801.337443,False,0.0,False,1801.337443 +1356f66c-3dd3-4172-a61e-bed038adb22f,moonshotai/Kimi-K2-Instruct-0905,together_ai,regex-log,3478,4053,7531,674.1976,False,0.0,moonshotai/Kimi-K2-Instruct-0905,regex-log,674.1976,False,0.4,False,674.1976 +5636de4e-337b-4383-90a8-5505af001b2c,gpt-5,openai,prove-plus-comm,1931,1316,3247,284.737252,True,1.0,gpt-5,prove-plus-comm,284.737252,True,0.8571428571428571,True,284.737252 +ed7cd3da-e642-4230-85b9-b4aa1476f314,gpt-5,openai,install-windows-3.11,8383,2860,11243,467.275171,False,0.0,gpt-5,install-windows-3.11,467.275171,False,0.0,False,467.275171 
+9b0e0c0c-2413-4c1c-b0a1-f627d2e7290e,deepseek-ai/DeepSeek-V3.1,together_ai,vulnerable-secret,8294,7652,15946,340.363162,True,1.0,deepseek-ai/DeepSeek-V3.1,vulnerable-secret,340.363162,True,0.4,True,340.363162 +50bc0e4a-e2a7-4c25-905e-a6e988ee22aa,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,financial-document-processor,10923,5184,16107,513.325155,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,financial-document-processor,513.325155,False,0.0,False,513.325155 +8d358420-62e4-4edc-b062-018556def2d8,zai-org/GLM-4.5-Air-FP8,together_ai,qemu-alpine-ssh,3693,6632,10325,858.671527,False,0.0,zai-org/GLM-4.5-Air-FP8,qemu-alpine-ssh,858.671527,False,0.0,False,858.671527 +c335124e-6426-47cb-9c63-39b9c66da73c,gemini-2.5-flash,gemini,financial-document-processor,14040,12724,26764,1172.18605,False,0.0,gemini-2.5-flash,financial-document-processor,1172.18605,False,0.0,False,1172.18605 +3515c5ce-4ba8-43d8-8b4a-7548d84bc8dd,openai/gpt-oss-120b,together_ai,install-windows-3.11,5656,1555,7211,214.174458,False,0.0,openai/gpt-oss-120b,install-windows-3.11,214.174458,False,0.0,False,214.174458 +6fa06099-a8bd-4ff8-b824-16b2daa5eea2,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,schemelike-metacircular-eval,15997,15179,31176,1705.2129,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,schemelike-metacircular-eval,1705.2129,False,0.0,False,1705.2129 +c89e0420-4761-467c-b267-37aedc652e7a,claude-opus-4-1-20250805,anthropic,polyglot-rust-c,3750,3784,7534,1007.816809,False,0.0,claude-opus-4-1-20250805,polyglot-rust-c,1007.816809,False,0.0,False,1007.816809 +ff5cd529-5759-4b07-a7b4-eb1e3cbb354a,deepseek-ai/DeepSeek-V3.1,together_ai,gpt2-codegolf,8692,7125,15817,696.311305,False,0.0,deepseek-ai/DeepSeek-V3.1,gpt2-codegolf,696.311305,False,0.0,False,696.311305 +77ddeb19-484d-4669-a7f3-fc61f0353db2,gemini-2.5-pro,gemini,pytorch-model-cli,2185,1710,3895,97.803647,False,0.0,gemini-2.5-pro,pytorch-model-cli,97.803647,False,0.4,False,97.803647 
+8b14f17c-3f53-44ba-a659-04f02e2db82b,openai/gpt-oss-120b,together_ai,sqlite-db-truncate,3307,2665,5972,798.021671,False,0.0,openai/gpt-oss-120b,sqlite-db-truncate,798.021671,False,0.0,False,798.021671 +c09d888f-0f84-42af-bd81-9307a68008a2,claude-opus-4-1-20250805,anthropic,mteb-retrieve,2170,1457,3627,81.395991,False,0.0,claude-opus-4-1-20250805,mteb-retrieve,81.395991,False,0.0,False,81.395991 +53f37b48-29fc-4014-ba84-9dff7882a6e6,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sqlite-db-truncate,3548,1734,5282,603.436217,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sqlite-db-truncate,603.436217,False,0.0,False,603.436217 +bc534b5c-5edc-4565-a997-d1064d098903,gpt-5,openai,mteb-leaderboard,31486,17980,49466,2711.199834,False,0.0,gpt-5,mteb-leaderboard,2711.199834,False,0.0,False,2711.199834 +9019bce4-5144-444b-a5c5-17943cf89756,claude-opus-4-1-20250805,anthropic,cancel-async-tasks,5276,3662,8938,407.661187,False,0.0,claude-opus-4-1-20250805,cancel-async-tasks,407.661187,False,0.125,False,407.661187 +e84f9480-c3bf-44bc-abc6-fcd83b7d9366,gemini-2.5-flash,gemini,dna-assembly,0,0,0,730.423479,False,0.0,gemini-2.5-flash,dna-assembly,730.423479,False,0.0,False,730.423479 +7ceca493-3cb9-4d35-9826-794cd42dae4a,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-cython-ext,17439,6125,23564,900.451124,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-cython-ext,900.451124,False,0.0,False,900.451124 +94a160a6-b1b5-4717-8d02-3f16d21a5349,moonshotai/Kimi-K2-Instruct-0905,together_ai,port-compressor,80147,39948,120095,1473.23885,False,0.0,moonshotai/Kimi-K2-Instruct-0905,port-compressor,1473.23885,False,0.0,False,1473.23885 +8864f8dd-7ec5-4830-8214-c46ad3c36599,openai/gpt-oss-120b,together_ai,dna-insert,1630,1665,3295,362.636901,False,0.0,openai/gpt-oss-120b,dna-insert,362.636901,False,0.0,False,362.636901 
+a7af89f4-944b-477a-ac52-4c7df1305aee,claude-sonnet-4-20250514,anthropic,log-summary-date-ranges,9221,3105,12326,251.878141,True,1.0,claude-sonnet-4-20250514,log-summary-date-ranges,251.878141,True,1.0,True,251.878141 +1bcbf4b8-2e6b-4b7c-949d-6e56a4c7addb,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,hf-model-inference,6517,2025,8542,894.896704,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,hf-model-inference,894.896704,True,0.8,True,894.896704 +259a0e46-d613-45fc-9924-6c46b5dd62fc,grok-4-0709,xai,build-pov-ray,28844,8700,37544,1959.123888,True,1.0,grok-4-0709,build-pov-ray,1959.123888,True,1.0,True,1959.123888 +af9d300f-272e-4492-b156-80bf6a2f5210,gemini-2.5-flash,gemini,cobol-modernization,4905,3917,8822,174.45787,False,0.0,gemini-2.5-flash,cobol-modernization,174.45787,False,0.2,False,174.45787 +1160389f-7de8-4a58-ab22-0fe95209e81b,grok-4-0709,xai,build-initramfs-qemu,1310,1345,2655,954.757592,False,0.0,grok-4-0709,build-initramfs-qemu,954.757592,False,0.0,False,954.757592 +07146589-b046-4b5c-bdc1-6aa2f0b412d5,claude-opus-4-1-20250805,anthropic,gpt2-codegolf,12052,13450,25502,900.035935,False,0.0,claude-opus-4-1-20250805,gpt2-codegolf,900.035935,False,0.0,False,900.035935 +37c8c9d8-62ba-4b65-8f8e-c69688f862b2,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,fix-git,2318,1284,3602,101.84988,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,fix-git,101.84988,False,0.0,False,101.84988 +338b1c84-067f-4fd9-b8ec-fb8eace91e00,claude-opus-4-1-20250805,anthropic,write-compressor,11522,8749,20271,900.52265,False,0.0,claude-opus-4-1-20250805,write-compressor,900.52265,False,0.0,False,900.52265 +1a8b49d3-d115-4794-966b-0b697e0022db,gpt-5-nano,openai,regex-log,3157,2782,5939,449.711529,True,1.0,gpt-5-nano,regex-log,449.711529,True,0.2,True,449.711529 
+9d84a83f-581b-4b4e-a894-0a71697ebebc,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,fix-code-vulnerability,8892,1813,10705,947.507452,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,fix-code-vulnerability,947.507452,False,0.4,False,947.507452 +ece02cc6-a3c5-4969-a7d3-b85ffc7f7368,grok-code-fast-1,xai,port-compressor,27795,19859,47654,1316.031081,False,0.0,grok-code-fast-1,port-compressor,1316.031081,False,0.0,False,1316.031081 +42597e46-a6a2-4106-991e-24215edae1b2,zai-org/GLM-4.5-Air-FP8,together_ai,git-leak-recovery,2174,1988,4162,171.647829,True,1.0,zai-org/GLM-4.5-Air-FP8,git-leak-recovery,171.647829,True,0.8,True,171.647829 +069d7ca8-b547-4f96-ba27-e935985b8439,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,password-recovery,1569,1803,3372,1324.457706,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,password-recovery,1324.457706,False,0.0,False,1324.457706 +4598f8be-a0a2-458e-a31c-d59dd56154cf,claude-opus-4-1-20250805,anthropic,largest-eigenval,6967,5738,12705,906.470496,False,0.0,claude-opus-4-1-20250805,largest-eigenval,906.470496,False,0.25,False,906.470496 +40546e59-25d0-4530-8155-6a294d001126,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,run-pdp11-code,3266,1328,4594,1064.583774,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,run-pdp11-code,1064.583774,False,0.0,False,1064.583774 +e62d30a4-2f82-4ad7-8b4a-380a802a1e6e,zai-org/GLM-4.5-Air-FP8,together_ai,cancel-async-tasks,456,1217,1673,185.145985,False,0.0,zai-org/GLM-4.5-Air-FP8,cancel-async-tasks,185.145985,False,0.2,False,185.145985 +12cc21bc-0d8e-4675-964b-c67d323cf3e2,gemini-2.5-pro,gemini,port-compressor,24265,20639,44904,3618.339634,False,0.0,gemini-2.5-pro,port-compressor,3618.339634,False,0.0,False,3618.339634 +206a9c8e-e70f-4a0d-8e2a-34222840df5b,grok-code-fast-1,xai,constraints-scheduling,3504,3866,7370,83.74445,True,1.0,grok-code-fast-1,constraints-scheduling,83.74445,True,0.8,True,83.74445 
+3f11f238-54d4-4ac8-8582-51ede6a41a70,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,model-extraction-relu-logits,7875,9060,16935,912.443051,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,model-extraction-relu-logits,912.443051,False,0.0,False,912.443051 +92c3c4a2-3827-4778-b519-b20bd53c5d88,OpenAI/gpt-oss-20B,together_ai,password-recovery,985,2531,3516,87.003179,False,0.0,OpenAI/gpt-oss-20B,password-recovery,87.003179,False,0.0,False,87.003179 +7137e1ff-6000-414f-a5f6-cfd1125be95a,gpt-5-nano,openai,count-dataset-tokens,7858,3099,10957,925.964914,False,0.0,gpt-5-nano,count-dataset-tokens,925.964914,False,0.0,False,925.964914 +3d6d09c9-79e2-443b-81d6-faae4f95ece1,gpt-5-mini,openai,fix-ocaml-gc,25090,15903,40993,3637.845316,False,0.0,gpt-5-mini,fix-ocaml-gc,3637.845316,False,0.0,False,3637.845316 +f80a04e9-2b60-4aff-8a2c-4a6ea03bf2c5,claude-opus-4-1-20250805,anthropic,build-pmars,14352,2613,16965,160.044596,True,1.0,claude-opus-4-1-20250805,build-pmars,160.044596,True,0.5,True,160.044596 +3cea762d-1761-4a8f-9ca0-cdb45e4c88c2,grok-4-0709,xai,code-from-image,782,339,1121,1866.739917,False,0.0,grok-4-0709,code-from-image,1866.739917,False,0.0,False,1866.739917 +1150d6b4-3ff6-45d9-af5a-c148d2306177,gpt-5,openai,polyglot-c-py,1650,1105,2755,145.604507,False,0.0,gpt-5,polyglot-c-py,145.604507,False,0.0,False,145.604507 +96e567d9-321f-4490-a62e-22f6da435d14,OpenAI/gpt-oss-20B,together_ai,password-recovery,1224,1655,2879,80.332563,False,0.0,OpenAI/gpt-oss-20B,password-recovery,80.332563,False,0.0,False,80.332563 +62195ec7-b3ea-4f19-828d-8fcc0b60bc6d,moonshotai/Kimi-K2-Instruct-0905,together_ai,wasm-pipeline,11030,5535,16565,357.450057,False,0.0,moonshotai/Kimi-K2-Instruct-0905,wasm-pipeline,357.450057,False,0.2,False,357.450057 +aaeba6f7-a66d-4806-ac10-9a74ec798f11,gemini-2.5-flash,gemini,qemu-alpine-ssh,1338,1275,2613,186.207167,False,0.0,gemini-2.5-flash,qemu-alpine-ssh,186.207167,False,0.0,False,186.207167 
+5f319ce4-f7c9-46c9-be10-dc4663a3af32,grok-4-0709,xai,mteb-retrieve,1785,962,2747,209.238869,False,0.0,grok-4-0709,mteb-retrieve,209.238869,False,0.0,False,209.238869 +7ad03ceb-6e84-452f-8bf9-d79866746e59,claude-opus-4-1-20250805,anthropic,polyglot-rust-c,18274,20010,38284,900.002896,False,0.0,claude-opus-4-1-20250805,polyglot-rust-c,900.002896,False,0.0,False,900.002896 +3e9afe9b-db9a-43e8-a4b8-b907adcfab7e,deepseek-ai/DeepSeek-V3.1,together_ai,password-recovery,3820,3996,7816,902.604878,False,0.0,deepseek-ai/DeepSeek-V3.1,password-recovery,902.604878,False,0.0,False,902.604878 +0380d20f-a843-427a-a5a1-7f3ff93cd53d,deepseek-ai/DeepSeek-V3.1,together_ai,model-extraction-relu-logits,9212,5491,14703,463.33761,False,0.0,deepseek-ai/DeepSeek-V3.1,model-extraction-relu-logits,463.33761,False,0.2,False,463.33761 +9d965db5-b38c-458b-b1a2-17df6b98bf07,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,cancel-async-tasks,7985,5583,13568,900.04131,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,cancel-async-tasks,900.04131,True,0.6,True,900.04131 +b63d7f95-2fbe-40e0-945c-a2ff495c6f8f,deepseek-ai/DeepSeek-V3.1,together_ai,port-compressor,37048,22052,59100,3604.34111,False,0.0,deepseek-ai/DeepSeek-V3.1,port-compressor,3604.34111,False,0.0,False,3604.34111 +1f72b7a6-faaa-4d08-9cff-68c142c80902,zai-org/GLM-4.5-Air-FP8,together_ai,fix-git,17313,4172,21485,902.426968,False,0.0,zai-org/GLM-4.5-Air-FP8,fix-git,902.426968,False,0.6,False,902.426968 +a14b0b9d-df3b-4a9d-bbd3-8305da6d1cbb,claude-opus-4-1-20250805,anthropic,vulnerable-secret,5432,4846,10278,382.275678,True,1.0,claude-opus-4-1-20250805,vulnerable-secret,382.275678,True,0.625,True,382.275678 +72041167-8233-4bcb-8065-704fec899395,grok-code-fast-1,xai,build-initramfs-qemu,1959,1086,3045,80.830086,False,0.0,grok-code-fast-1,build-initramfs-qemu,80.830086,False,0.0,False,80.830086 
+2c5e55aa-a6b7-41c0-b558-ea35d34dab06,gpt-5-mini,openai,reverse-engineering,68147,89856,158003,7832.939551,False,0.0,gpt-5-mini,reverse-engineering,7832.939551,False,0.0,False,7832.939551 +732dab7e-bf5d-48cb-a0f7-724c75bed214,moonshotai/Kimi-K2-Instruct-0905,together_ai,sqlite-db-truncate,1980,1943,3923,900.048903,False,0.0,moonshotai/Kimi-K2-Instruct-0905,sqlite-db-truncate,900.048903,False,0.0,False,900.048903 +569e2afa-1b3b-4705-9d79-403e7a9d9b7a,openai/gpt-oss-120b,together_ai,sanitize-git-repo,1954,1242,3196,93.422444,False,0.0,openai/gpt-oss-120b,sanitize-git-repo,93.422444,False,0.0,False,93.422444 +f23fff11-6f50-47e9-86f1-041580c2d253,gemini-2.5-pro,gemini,prove-plus-comm,1610,1375,2985,240.055873,True,1.0,gemini-2.5-pro,prove-plus-comm,240.055873,True,0.8,True,240.055873 +c95796cc-2261-42ee-a40d-583910b10742,gpt-5,openai,path-tracing,17096,10196,27292,1056.51882,False,0.0,gpt-5,path-tracing,1056.51882,False,0.0,False,1056.51882 +9b4d2167-867f-4846-b762-6476f4d17ac8,zai-org/GLM-4.5-Air-FP8,together_ai,break-filter-js-from-html,13638,16620,30258,1210.775896,False,0.0,zai-org/GLM-4.5-Air-FP8,break-filter-js-from-html,1210.775896,False,0.0,False,1210.775896 +1ce0fe41-f1c7-4bc0-8d1c-94bafbc5cc44,OpenAI/gpt-oss-20B,together_ai,tune-mjcf,2854,11242,14096,961.024847,False,0.0,OpenAI/gpt-oss-20B,tune-mjcf,961.024847,False,0.0,False,961.024847 +37509f38-6adc-4ef1-8386-42d58077ea1d,deepseek-ai/DeepSeek-V3.1,together_ai,cancel-async-tasks,3936,2864,6800,202.099645,True,1.0,deepseek-ai/DeepSeek-V3.1,cancel-async-tasks,202.099645,True,0.4,True,202.099645 +d4416e2d-af9f-42b9-814f-622638fc47c1,grok-code-fast-1,xai,build-cython-ext,9693,3548,13241,788.534485,False,0.0,grok-code-fast-1,build-cython-ext,788.534485,False,0.0,False,788.534485 +710a23fd-d90c-4c94-bf0b-71fdcc11b68c,claude-sonnet-4-20250514,anthropic,gpt2-codegolf,10002,9583,19585,900.08802,False,0.0,claude-sonnet-4-20250514,gpt2-codegolf,900.08802,False,0.0,False,900.08802 
+3f7f6b20-2f2f-4152-83c3-86a307d0bb37,gemini-2.5-flash,gemini,sqlite-db-truncate,3847,3089,6936,135.79395,False,0.0,gemini-2.5-flash,sqlite-db-truncate,135.79395,False,0.0,False,135.79395 +2a7142e7-095e-4520-9798-3270a5c7f9a7,moonshotai/Kimi-K2-Instruct-0905,together_ai,nginx-request-logging,5740,3543,9283,467.707808,False,0.0,moonshotai/Kimi-K2-Instruct-0905,nginx-request-logging,467.707808,False,0.4,False,467.707808 +fc51335c-0530-4216-aa91-df9e144e442f,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,polyglot-rust-c,4037,2195,6232,184.874006,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,polyglot-rust-c,184.874006,False,0.0,False,184.874006 +4cb87081-fb52-408f-aae1-0511cff8c314,gpt-5-mini,openai,polyglot-c-py,11346,6744,18090,900.027405,False,0.0,gpt-5-mini,polyglot-c-py,900.027405,False,0.0,False,900.027405 +845da8d8-487b-4667-870b-e9582cae3407,gemini-2.5-flash,gemini,wasm-pipeline,8484,4297,12781,900.037555,False,0.0,gemini-2.5-flash,wasm-pipeline,900.037555,False,0.4,False,900.037555 +d7bfb42f-de75-4c2c-be83-ce71a305d884,OpenAI/gpt-oss-20B,together_ai,install-klee-minimal,578,1027,1605,132.403881,False,0.0,OpenAI/gpt-oss-20B,install-klee-minimal,132.403881,False,0.0,False,132.403881 +71c3752a-1ee1-4939-a0aa-0ecce60cf68a,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,openssl-selfsigned-cert,3197,2271,5468,169.391154,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,openssl-selfsigned-cert,169.391154,True,0.4,True,169.391154 +95912b7e-a302-486c-aca7-fcbece978172,openai/gpt-oss-120b,together_ai,model-extraction-relu-logits,1544,1157,2701,94.462799,False,0.0,openai/gpt-oss-120b,model-extraction-relu-logits,94.462799,False,0.0,False,94.462799 +54ebaaa4-3ab0-4a84-b723-52034a84757c,claude-sonnet-4-20250514,anthropic,adaptive-rejection-sampler,12174,9193,21367,900.005874,False,0.0,claude-sonnet-4-20250514,adaptive-rejection-sampler,900.005874,False,0.0,False,900.005874 
+66da4493-692e-4994-b2c2-b643413bb672,OpenAI/gpt-oss-20B,together_ai,make-doom-for-mips,2024,8619,10643,917.600996,False,0.0,OpenAI/gpt-oss-20B,make-doom-for-mips,917.600996,False,0.0,False,917.600996 +2f0c5bb1-82c1-4057-a4bb-af22f7e5b3fd,moonshotai/Kimi-K2-Instruct-0905,together_ai,wasm-pipeline,8289,3391,11680,634.842622,False,0.0,moonshotai/Kimi-K2-Instruct-0905,wasm-pipeline,634.842622,False,0.2,False,634.842622 +9191c061-94bc-4190-a7ff-d9bac3e10a5c,claude-opus-4-1-20250805,anthropic,git-leak-recovery,3050,1999,5049,316.178437,True,1.0,claude-opus-4-1-20250805,git-leak-recovery,316.178437,True,1.0,True,316.178437 +619cec56-9023-4590-92ee-2bc921101657,gpt-5,openai,financial-document-processor,14312,14385,28697,609.575185,False,0.0,gpt-5,financial-document-processor,609.575185,False,0.0,False,609.575185 +f4a92dd1-8e89-40ea-8866-45fef756e430,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,configure-git-webserver,7358,2969,10327,900.518605,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,configure-git-webserver,900.518605,True,0.6,True,900.518605 +19859aa6-f1cc-4e75-a2a6-5db0156a6d06,gpt-5-mini,openai,count-dataset-tokens,16092,9492,25584,915.990035,False,0.0,gpt-5-mini,count-dataset-tokens,915.990035,False,0.0,False,915.990035 +a77fd5b8-34f9-4c5c-a566-ab006916f2fc,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,adaptive-rejection-sampler,8026,4486,12512,910.351965,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,adaptive-rejection-sampler,910.351965,False,0.0,False,910.351965 +9ae38130-a5d9-4d32-92ba-3b0031549ab2,OpenAI/gpt-oss-20B,together_ai,make-mips-interpreter,8008,20931,28939,1806.003414,False,0.0,OpenAI/gpt-oss-20B,make-mips-interpreter,1806.003414,False,0.0,False,1806.003414 +b567729b-1838-46c1-8325-930ad2d31507,grok-4-0709,xai,extract-elf,4350,2136,6486,893.761135,False,0.0,grok-4-0709,extract-elf,893.761135,False,0.2,False,893.761135 
+59230b88-d3e4-4114-b784-a545e4d4f7ec,grok-code-fast-1,xai,extract-elf,6842,1312,8154,96.344268,False,0.0,grok-code-fast-1,extract-elf,96.344268,False,0.6,False,96.344268 +e5b9f04d-951c-4611-8087-b24b3fa3d703,openai/gpt-oss-120b,together_ai,fix-git,4219,1680,5899,124.362502,True,1.0,openai/gpt-oss-120b,fix-git,124.362502,True,0.6,True,124.362502 +5189fbf9-0111-4150-a0f1-9fd78ab8d132,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,count-dataset-tokens,14850,3126,17976,647.452753,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,count-dataset-tokens,647.452753,False,0.0,False,647.452753 +230ef66e-5a8b-4b46-8ddc-727491b5b964,gpt-5-mini,openai,count-dataset-tokens,11672,8275,19947,908.704351,False,0.0,gpt-5-mini,count-dataset-tokens,908.704351,False,0.0,False,908.704351 +6e47495f-ed54-4bc7-b158-cb6f94028488,claude-sonnet-4-20250514,anthropic,feal-linear-cryptanalysis,22429,16192,38621,1802.770913,False,0.0,claude-sonnet-4-20250514,feal-linear-cryptanalysis,1802.770913,False,0.0,False,1802.770913 +6fb4566d-018c-4fa4-8a43-ce2db8257d10,claude-opus-4-1-20250805,anthropic,polyglot-rust-c,10721,10797,21518,900.502842,False,0.0,claude-opus-4-1-20250805,polyglot-rust-c,900.502842,False,0.0,False,900.502842 +3e4d3122-e7a6-40f3-8239-33e4e9706245,OpenAI/gpt-oss-20B,together_ai,db-wal-recovery,391,1456,1847,326.298205,False,0.0,OpenAI/gpt-oss-20B,db-wal-recovery,326.298205,False,0.0,False,326.298205 +01b691ca-923b-411d-9559-ab2dc1c12dea,gemini-2.5-pro,gemini,financial-document-processor,10417,4349,14766,463.530648,False,0.0,gemini-2.5-pro,financial-document-processor,463.530648,False,0.0,False,463.530648 +8c00bb8f-5bfd-4ff7-8c0c-966207be7589,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,train-fasttext,16731,7517,24248,2789.764409,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,train-fasttext,2789.764409,False,0.0,False,2789.764409 
+baa7af25-5148-4ef8-b191-e85a7343bd34,gpt-5-mini,openai,reshard-c4-data,4745,5649,10394,763.051196,False,0.0,gpt-5-mini,reshard-c4-data,763.051196,False,0.0,False,763.051196 +f7be1a8a-e68e-45d6-a540-1c50e2a391a1,gpt-5,openai,feal-differential-cryptanalysis,9470,9014,18484,982.667163,False,0.0,gpt-5,feal-differential-cryptanalysis,982.667163,False,0.0,False,982.667163 +4942d5c3-b892-4a38-a37b-8b5db6d04d8b,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,git-leak-recovery,2478,2133,4611,347.120535,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,git-leak-recovery,347.120535,True,1.0,True,347.120535 +2a304c8f-ce37-449c-a47d-11d081360303,deepseek-ai/DeepSeek-V3.1,together_ai,filter-js-from-html,2189,1761,3950,155.615752,False,0.0,deepseek-ai/DeepSeek-V3.1,filter-js-from-html,155.615752,False,0.0,False,155.615752 +19b899fb-4901-4c1b-99f3-298517133102,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,schemelike-metacircular-eval,10433,7236,17669,521.083524,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,schemelike-metacircular-eval,521.083524,False,0.0,False,521.083524 +00a11fa8-017d-4c21-937d-fcab17c00c82,deepseek-ai/DeepSeek-V3.1,together_ai,log-summary-date-ranges,7838,2207,10045,144.934484,False,0.0,deepseek-ai/DeepSeek-V3.1,log-summary-date-ranges,144.934484,False,0.4,False,144.934484 +97274735-5ad9-422f-bd69-18a5f51b5ce8,deepseek-ai/DeepSeek-V3.1,together_ai,sqlite-with-gcov,10218,2153,12371,233.986976,False,0.0,deepseek-ai/DeepSeek-V3.1,sqlite-with-gcov,233.986976,False,0.8,False,233.986976 +04bfb531-0353-4cb7-af04-2f13eed81753,gpt-5,openai,video-processing,5676,4917,10593,326.26183,False,0.0,gpt-5,video-processing,326.26183,False,0.0,False,326.26183 +baaec447-920a-48d3-8def-6d7e74554e17,grok-code-fast-1,xai,qemu-startup,951,520,1471,77.342413,False,0.0,grok-code-fast-1,qemu-startup,77.342413,False,0.0,False,77.342413 
+110ceb01-9bb6-4ee9-a536-3befcdc6dfaf,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,pytorch-model-cli,7683,7608,15291,519.175958,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,pytorch-model-cli,519.175958,False,0.0,False,519.175958 +b902b60d-2196-4af3-885d-3eb23731e073,zai-org/GLM-4.5-Air-FP8,together_ai,schemelike-metacircular-eval,33937,34645,68582,1214.766976,False,0.0,zai-org/GLM-4.5-Air-FP8,schemelike-metacircular-eval,1214.766976,False,0.0,False,1214.766976 +778d0912-eb5d-4fbd-9e64-1536cd1b248d,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,video-processing,3636,2883,6519,191.416571,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,video-processing,191.416571,False,0.0,False,191.416571 +3875e65f-eafe-4a9f-aba6-30cab2c32547,OpenAI/gpt-oss-20B,together_ai,openssl-selfsigned-cert,1103,203,1306,14.464017,False,0.0,OpenAI/gpt-oss-20B,openssl-selfsigned-cert,14.464017,False,0.2,False,14.464017 +26777cb4-a28f-463a-a1d1-d98648b3805a,gpt-5-mini,openai,vulnerable-secret,17262,9136,26398,810.772388,True,1.0,gpt-5-mini,vulnerable-secret,810.772388,True,0.4,True,810.772388 +4b1d74f6-94ca-45fd-8ce6-c34ef716ed70,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,wasm-pipeline,2102,2190,4292,86.213469,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,wasm-pipeline,86.213469,False,0.0,False,86.213469 +0d0d1e25-9944-4d83-bfc5-0f1630e89e53,gemini-2.5-flash,gemini,sqlite-db-truncate,3591,2155,5746,696.936867,False,0.0,gemini-2.5-flash,sqlite-db-truncate,696.936867,False,0.0,False,696.936867 +b9d3c095-47bb-4b34-9e26-057d532b1467,gemini-2.5-pro,gemini,mteb-retrieve,2179,1085,3264,151.384585,False,0.0,gemini-2.5-pro,mteb-retrieve,151.384585,False,0.0,False,151.384585 +d5e22f1c-526e-425d-b8db-f69bcc7836bf,grok-4-0709,xai,code-from-image,7589,3612,11201,1209.333347,False,0.0,grok-4-0709,code-from-image,1209.333347,False,0.0,False,1209.333347 
+6687c461-5cb3-4b45-aac0-7902384f48d3,claude-sonnet-4-20250514,anthropic,mteb-leaderboard,962,501,1463,160.061072,False,0.0,claude-sonnet-4-20250514,mteb-leaderboard,160.061072,False,0.0,False,160.061072 +0cfdc9ce-edfb-46c0-b7d3-67e1f4d08736,grok-4-0709,xai,distribution-search,2014,1006,3020,455.419628,True,1.0,grok-4-0709,distribution-search,455.419628,True,0.4,True,455.419628 +47f85501-bf1c-4cab-9bcb-7ae60f184f2c,claude-opus-4-1-20250805,anthropic,path-tracing,19707,14207,33914,1811.064664,False,0.0,claude-opus-4-1-20250805,path-tracing,1811.064664,False,0.0,False,1811.064664 +4cd74840-f383-42ca-b550-aaec276bceff,zai-org/GLM-4.5-Air-FP8,together_ai,circuit-fibsqrt,24822,29491,54313,1594.485598,False,0.0,zai-org/GLM-4.5-Air-FP8,circuit-fibsqrt,1594.485598,False,0.0,False,1594.485598 +92ee607c-d2de-4065-9f06-7aa0eb79dbf3,claude-opus-4-1-20250805,anthropic,pypi-server,5150,2590,7740,331.972522,True,1.0,claude-opus-4-1-20250805,pypi-server,331.972522,True,1.0,True,331.972522 +2a1ffe06-9243-4547-a979-859aa768204b,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,largest-eigenval,8591,3760,12351,299.38884,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,largest-eigenval,299.38884,False,0.0,False,299.38884 +42792c29-5e49-4367-80f8-2d7a357c5537,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,form-filling,8767,7398,16165,478.692785,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,form-filling,478.692785,True,0.8,True,478.692785 +01d83249-77ec-4931-b12b-4805b6ea004b,moonshotai/Kimi-K2-Instruct-0905,together_ai,git-leak-recovery,2514,2378,4892,169.975227,True,1.0,moonshotai/Kimi-K2-Instruct-0905,git-leak-recovery,169.975227,True,1.0,True,169.975227 +0c8edb4d-8499-42d7-9ed9-3afa993aad58,zai-org/GLM-4.5-Air-FP8,together_ai,schemelike-metacircular-eval,22915,24781,47696,2428.692674,False,0.0,zai-org/GLM-4.5-Air-FP8,schemelike-metacircular-eval,2428.692674,False,0.0,False,2428.692674 
+07929289-c988-4c7d-bed9-2e2cb0248511,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,pytorch-model-recovery,8757,6023,14780,751.309458,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,pytorch-model-recovery,751.309458,True,0.8,True,751.309458 +614fbc14-f301-4bef-bd3b-ab65e6b16d17,claude-opus-4-1-20250805,anthropic,form-filling,5874,4298,10172,253.895368,True,1.0,claude-opus-4-1-20250805,form-filling,253.895368,True,1.0,True,253.895368 +ecf2f8d3-2b98-4f2a-b906-c4307443caa8,deepseek-ai/DeepSeek-V3.1,together_ai,cancel-async-tasks,1825,1109,2934,28.96675,False,0.0,deepseek-ai/DeepSeek-V3.1,cancel-async-tasks,28.96675,False,0.4,False,28.96675 +423b3398-db3b-4d1f-82ba-98e9b3080dd3,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-cython-ext,8103,3559,11662,902.134841,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-cython-ext,902.134841,False,0.0,False,902.134841 +b04e852e-417c-454f-a9f3-d281597c5bb9,gpt-5,openai,cobol-modernization,6337,3847,10184,217.411476,True,1.0,gpt-5,cobol-modernization,217.411476,True,1.0,True,217.411476 +6265fc34-cc3b-44a7-a5e2-97e10bb3282c,deepseek-ai/DeepSeek-V3.1,together_ai,large-scale-text-editing,6449,5246,11695,337.414913,False,0.0,deepseek-ai/DeepSeek-V3.1,large-scale-text-editing,337.414913,False,0.0,False,337.414913 +a9c1c270-64db-46e1-86be-a3eebea2218e,deepseek-ai/DeepSeek-V3.1,together_ai,sanitize-git-repo,20505,5529,26034,802.64853,False,0.0,deepseek-ai/DeepSeek-V3.1,sanitize-git-repo,802.64853,False,0.0,False,802.64853 +8644ac58-6bd4-4dbf-a75d-043cb36770ac,zai-org/GLM-4.5-Air-FP8,together_ai,sqlite-db-truncate,4946,3706,8652,198.093197,False,0.0,zai-org/GLM-4.5-Air-FP8,sqlite-db-truncate,198.093197,False,0.0,False,198.093197 +6e87e728-0f70-4f4e-88ef-4f417b654a90,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,extract-elf,3564,2562,6126,274.899049,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,extract-elf,274.899049,False,0.0,False,274.899049 
+bd0c604e-2fcc-4b5e-bdb6-d66b4f06d8e9,gpt-5-mini,openai,git-leak-recovery,7941,7312,15253,768.21181,False,0.0,gpt-5-mini,git-leak-recovery,768.21181,False,0.0,False,768.21181 +4cd4fa16-cdc0-4013-ab0e-e535fec3386f,gemini-2.5-pro,gemini,pypi-server,6416,3271,9687,511.302286,True,1.0,gemini-2.5-pro,pypi-server,511.302286,True,0.8,True,511.302286 +60563665-81a2-4c58-9559-9e6948a1f35b,claude-opus-4-1-20250805,anthropic,log-summary-date-ranges,7660,1919,9579,160.536924,True,1.0,claude-opus-4-1-20250805,log-summary-date-ranges,160.536924,True,0.8888888888888888,True,160.536924 +38bcfac2-4b53-40da-911a-4a7aa19fde6e,claude-opus-4-1-20250805,anthropic,train-fasttext,25336,12811,38147,3600.000711,False,0.0,claude-opus-4-1-20250805,train-fasttext,3600.000711,False,0.2857142857142857,False,3600.000711 +3d5d2d0f-2e5c-47c9-8ab0-38639b16fb49,gpt-5-mini,openai,polyglot-rust-c,1885,2187,4072,440.595907,False,0.0,gpt-5-mini,polyglot-rust-c,440.595907,False,0.0,False,440.595907 +565044c7-181f-42a0-a98f-2447832364f3,zai-org/GLM-4.5-Air-FP8,together_ai,hf-model-inference,5087,3765,8852,401.206725,True,1.0,zai-org/GLM-4.5-Air-FP8,hf-model-inference,401.206725,True,0.8,True,401.206725 +9e3c93af-92f8-4104-ae4d-cb74402303e3,claude-sonnet-4-20250514,anthropic,password-recovery,3437,3643,7080,475.896713,False,0.0,claude-sonnet-4-20250514,password-recovery,475.896713,False,0.4,False,475.896713 +932c3ea9-fbf9-42dc-8a74-5e3835f88734,gpt-5-mini,openai,financial-document-processor,21250,12341,33591,1200.544146,False,0.0,gpt-5-mini,financial-document-processor,1200.544146,False,0.0,False,1200.544146 +b9c5b36a-db33-4a34-ae6e-09ec5e5939cd,gpt-5-mini,openai,build-initramfs-qemu,4942,4201,9143,900.568735,False,0.0,gpt-5-mini,build-initramfs-qemu,900.568735,False,0.0,False,900.568735 +78cd3ea7-1c3d-4adf-ac00-290cbf33e7b6,gemini-2.5-pro,gemini,password-recovery,7986,5507,13493,933.364235,False,0.0,gemini-2.5-pro,password-recovery,933.364235,False,0.0,False,933.364235 
+7151285d-ca87-4f88-a1da-731b3a7e85fb,claude-opus-4-1-20250805,anthropic,configure-git-webserver,6399,1926,8325,416.718266,True,1.0,claude-opus-4-1-20250805,configure-git-webserver,416.718266,True,0.625,True,416.718266 +559da0f5-1237-48be-b18a-fe0e36660886,openai/gpt-oss-120b,together_ai,dna-assembly,5754,1782,7536,171.88872,False,0.0,openai/gpt-oss-120b,dna-assembly,171.88872,False,0.0,False,171.88872 +dd610535-9494-4088-8663-f97f44054c1b,gpt-5-mini,openai,winning-avg-corewars,23445,20647,44092,3607.859696,False,0.0,gpt-5-mini,winning-avg-corewars,3607.859696,False,0.0,False,3607.859696 +73d81b14-c1fa-447a-9639-7347d2656249,gemini-2.5-pro,gemini,form-filling,6200,5293,11493,298.99749,False,0.0,gemini-2.5-pro,form-filling,298.99749,False,0.2,False,298.99749 +45fb27e2-e098-4c09-b6c6-1f1c99f0323f,OpenAI/gpt-oss-20B,together_ai,mteb-retrieve,984,2399,3383,163.02571,False,0.0,OpenAI/gpt-oss-20B,mteb-retrieve,163.02571,False,0.0,False,163.02571 +683d4f59-6d7f-422d-a42b-0a726b65423e,OpenAI/gpt-oss-20B,together_ai,extract-elf,168,1030,1198,143.858656,False,0.0,OpenAI/gpt-oss-20B,extract-elf,143.858656,False,0.2,False,143.858656 +f20a9116-c776-419b-abad-2d1964329e2f,grok-4-0709,xai,mteb-retrieve,1712,1153,2865,283.055218,False,0.0,grok-4-0709,mteb-retrieve,283.055218,False,0.0,False,283.055218 +764ea5e2-dd54-45fd-8bc7-5525451330d9,claude-sonnet-4-20250514,anthropic,openssl-selfsigned-cert,4128,3153,7281,292.147122,True,1.0,claude-sonnet-4-20250514,openssl-selfsigned-cert,292.147122,True,0.8,True,292.147122 +461e9c0b-d5bd-4190-9776-b621a9e8c217,claude-opus-4-1-20250805,anthropic,hf-model-inference,9411,5109,14520,467.603847,False,0.0,claude-opus-4-1-20250805,hf-model-inference,467.603847,False,0.25,False,467.603847 +962d07e7-d0f8-4c21-899a-64c2684d4d5f,claude-opus-4-1-20250805,anthropic,nginx-request-logging,5158,2411,7569,100.328306,True,1.0,claude-opus-4-1-20250805,nginx-request-logging,100.328306,True,1.0,True,100.328306 
+5bd5fbb1-5125-4fac-9abe-04feb78059e5,moonshotai/Kimi-K2-Instruct-0905,together_ai,hf-model-inference,7851,6102,13953,683.018879,False,0.0,moonshotai/Kimi-K2-Instruct-0905,hf-model-inference,683.018879,False,0.0,False,683.018879 +09810eb0-c4a3-4d74-a503-3ff019dc2d56,claude-sonnet-4-20250514,anthropic,openssl-selfsigned-cert,4427,3559,7986,166.601485,True,1.0,claude-sonnet-4-20250514,openssl-selfsigned-cert,166.601485,True,0.8,True,166.601485 +3acd3c36-8da2-4cb2-b6c3-78e51ad977d3,claude-opus-4-1-20250805,anthropic,bn-fit-modify,12522,6293,18815,709.066568,True,1.0,claude-opus-4-1-20250805,bn-fit-modify,709.066568,True,0.875,True,709.066568 +4ae2c74c-06d1-463d-9b19-bf60401c71fa,gemini-2.5-pro,gemini,code-from-image,5959,1858,7817,279.766914,True,1.0,gemini-2.5-pro,code-from-image,279.766914,True,1.0,True,279.766914 +6bb19af1-6995-41e3-bb84-0f7cf04ebf22,zai-org/GLM-4.5-Air-FP8,together_ai,build-pmars,13997,8438,22435,671.288101,False,0.0,zai-org/GLM-4.5-Air-FP8,build-pmars,671.288101,False,0.6,False,671.288101 +b93a28df-aa0a-443c-8e85-9196b91259a1,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,fix-git,6342,3584,9926,566.232465,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,fix-git,566.232465,True,1.0,True,566.232465 +d1563f30-58e4-472c-8888-d9dde2c6ecb3,gemini-2.5-flash,gemini,build-initramfs-qemu,2769,2086,4855,315.570178,False,0.0,gemini-2.5-flash,build-initramfs-qemu,315.570178,False,0.0,False,315.570178 +77a76ef4-1645-4147-ab67-54cf6e6b9164,gpt-5-nano,openai,form-filling,4822,3146,7968,416.223106,True,1.0,gpt-5-nano,form-filling,416.223106,True,0.6,True,416.223106 +219314c6-3848-4ad1-9449-c6fbe06e5f82,openai/gpt-oss-120b,together_ai,gpt2-codegolf,2877,7048,9925,608.671783,False,0.0,openai/gpt-oss-120b,gpt2-codegolf,608.671783,False,0.0,False,608.671783 +583c8ec8-67df-453b-906f-ce43f79d7799,gpt-5,openai,cancel-async-tasks,1783,1148,2931,129.744433,True,1.0,gpt-5,cancel-async-tasks,129.744433,True,0.6,True,129.744433 
+38a2f1fc-0a22-4cac-bf70-5a68310607aa,zai-org/GLM-4.5-Air-FP8,together_ai,build-pov-ray,14626,11196,25822,1701.299445,False,0.0,zai-org/GLM-4.5-Air-FP8,build-pov-ray,1701.299445,False,0.0,False,1701.299445 +226a31d3-0056-476c-a5d3-25a53d667a34,claude-opus-4-1-20250805,anthropic,polyglot-c-py,1716,1541,3257,413.786451,False,0.0,claude-opus-4-1-20250805,polyglot-c-py,413.786451,False,0.0,False,413.786451 +af895e31-122e-4263-bbe1-13d5904723a8,gpt-5-mini,openai,filter-js-from-html,2479,2616,5095,126.025126,False,0.0,gpt-5-mini,filter-js-from-html,126.025126,False,0.0,False,126.025126 +fa6a4c84-53ba-4db3-9a2b-93f90c51c384,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sanitize-git-repo,9903,3419,13322,685.862373,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sanitize-git-repo,685.862373,False,0.0,False,685.862373 +20385de8-e4a0-454d-a96b-0ebc7c58f009,zai-org/GLM-4.5-Air-FP8,together_ai,make-mips-interpreter,24682,17511,42193,2101.725902,False,0.0,zai-org/GLM-4.5-Air-FP8,make-mips-interpreter,2101.725902,False,0.0,False,2101.725902 +1acf53de-645b-44d6-b21a-b341b97f795c,claude-opus-4-1-20250805,anthropic,polyglot-rust-c,9957,9111,19068,900.685443,False,0.0,claude-opus-4-1-20250805,polyglot-rust-c,900.685443,False,0.0,False,900.685443 +80cbfbe0-3393-477c-a13f-21a2753d2ce5,claude-opus-4-1-20250805,anthropic,regex-log,3500,2853,6353,302.706542,False,0.0,claude-opus-4-1-20250805,regex-log,302.706542,False,0.5714285714285714,False,302.706542 +e617cf75-8156-4ae3-bb0d-683be8e2e998,gemini-2.5-pro,gemini,build-pmars,16424,3169,19593,630.295473,True,1.0,gemini-2.5-pro,build-pmars,630.295473,True,1.0,True,630.295473 +a8a7114f-cac2-477b-9042-4012a0240cbc,openai/gpt-oss-120b,together_ai,build-initramfs-qemu,10520,10057,20577,916.297652,False,0.0,openai/gpt-oss-120b,build-initramfs-qemu,916.297652,False,0.0,False,916.297652 
+387a5334-b5d8-47ca-a0fa-6cd76ae1a07f,claude-opus-4-1-20250805,anthropic,feal-linear-cryptanalysis,18484,16764,35248,1802.532733,False,0.0,claude-opus-4-1-20250805,feal-linear-cryptanalysis,1802.532733,False,0.0,False,1802.532733 +106afd33-2aac-4f17-8d8f-198342f7bde5,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,tune-mjcf,4441,3463,7904,224.108556,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,tune-mjcf,224.108556,False,0.0,False,224.108556 +eb2121a9-fbec-469f-8ce0-0747a2c8bb2a,grok-code-fast-1,xai,path-tracing,2027,1730,3757,104.654786,False,0.0,grok-code-fast-1,path-tracing,104.654786,False,0.0,False,104.654786 +c901c141-be15-477b-90d4-938d0b4e7323,gemini-2.5-flash,gemini,mteb-retrieve,1878,932,2810,171.517033,False,0.0,gemini-2.5-flash,mteb-retrieve,171.517033,False,0.0,False,171.517033 +5b739d6d-1a5d-496b-aafe-cc66ef911032,zai-org/GLM-4.5-Air-FP8,together_ai,tune-mjcf,23546,17299,40845,900.470388,False,0.0,zai-org/GLM-4.5-Air-FP8,tune-mjcf,900.470388,False,0.0,False,900.470388 +d41b4881-05a7-4148-8d96-3f044bcce710,moonshotai/Kimi-K2-Instruct-0905,together_ai,train-fasttext,18244,10645,28889,1825.768686,False,0.0,moonshotai/Kimi-K2-Instruct-0905,train-fasttext,1825.768686,False,0.2,False,1825.768686 +86fde7dd-f8b4-4551-8c4a-ca07e17eead1,gemini-2.5-flash,gemini,filter-js-from-html,1202,8522,9724,912.106816,False,0.0,gemini-2.5-flash,filter-js-from-html,912.106816,False,0.0,False,912.106816 +9c6dd741-2410-4197-a925-044d060d9720,gpt-5-nano,openai,db-wal-recovery,5639,6772,12411,911.419391,False,0.0,gpt-5-nano,db-wal-recovery,911.419391,False,0.0,False,911.419391 +7c66b406-eadb-4ca1-b515-3e08e6ce862e,gpt-5,openai,reverse-engineering,14640,7293,21933,606.120466,True,1.0,gpt-5,reverse-engineering,606.120466,True,0.6666666666666666,True,606.120466 
+1d2e5304-d74f-4073-aa5f-9c3a9743d2d6,deepseek-ai/DeepSeek-V3.1,together_ai,form-filling,8838,6898,15736,433.218726,True,1.0,deepseek-ai/DeepSeek-V3.1,form-filling,433.218726,True,0.8,True,433.218726 +77daed4f-a7a5-4e5b-8ff7-6cc5a9746454,claude-opus-4-1-20250805,anthropic,constraints-scheduling,4988,3376,8364,109.424085,True,1.0,claude-opus-4-1-20250805,constraints-scheduling,109.424085,True,0.8888888888888888,True,109.424085 +2f3f2560-34ef-4277-97af-b49f16738bd8,gemini-2.5-flash,gemini,db-wal-recovery,7065,20432,27497,907.301296,False,0.0,gemini-2.5-flash,db-wal-recovery,907.301296,False,0.0,False,907.301296 +622b84b3-7a4e-4b5e-8804-c81199a26874,gemini-2.5-pro,gemini,feal-differential-cryptanalysis,4336,4784,9120,751.377285,False,0.0,gemini-2.5-pro,feal-differential-cryptanalysis,751.377285,False,0.6,False,751.377285 +32f6148f-d383-401c-873e-bca2ba8a7afe,grok-code-fast-1,xai,gpt2-codegolf,1642,1353,2995,159.615188,False,0.0,grok-code-fast-1,gpt2-codegolf,159.615188,False,0.0,False,159.615188 +34b25c45-b0ba-4f79-9f03-e9270de7ec2c,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,schemelike-metacircular-eval,37717,20271,57988,1564.096975,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,schemelike-metacircular-eval,1564.096975,False,0.0,False,1564.096975 +d2bbee39-1247-4ccc-9029-fb321b3ea40b,grok-4-0709,xai,install-windows-3.11,14175,4724,18899,1085.602217,False,0.0,grok-4-0709,install-windows-3.11,1085.602217,False,0.0,False,1085.602217 +b20a0562-1294-4e4d-8551-9879a2ce9aff,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,constraints-scheduling,8926,9714,18640,674.796837,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,constraints-scheduling,674.796837,True,1.0,True,674.796837 +582e389d-1c75-407d-8a52-ec9f34d09591,gpt-5,openai,configure-git-webserver,5575,2162,7737,367.7218,True,1.0,gpt-5,configure-git-webserver,367.7218,True,1.0,True,367.7218 
+15aead98-2744-4c83-ba52-3e1ff732c594,gpt-5,openai,cancel-async-tasks,1936,1312,3248,441.621822,True,1.0,gpt-5,cancel-async-tasks,441.621822,True,0.6,True,441.621822 +1fc36c0c-9446-4d39-885e-efa9318ddf08,OpenAI/gpt-oss-20B,together_ai,log-summary-date-ranges,1491,2185,3676,70.176661,False,0.0,OpenAI/gpt-oss-20B,log-summary-date-ranges,70.176661,False,0.0,False,70.176661 +2a577057-8f4d-4baf-8141-afd3b3311534,moonshotai/Kimi-K2-Instruct-0905,together_ai,feal-linear-cryptanalysis,18672,14359,33031,1830.016618,False,0.0,moonshotai/Kimi-K2-Instruct-0905,feal-linear-cryptanalysis,1830.016618,False,0.0,False,1830.016618 +26984e19-0f0e-40c4-876e-0edaef947c3a,deepseek-ai/DeepSeek-V3.1,together_ai,reverse-engineering,23304,15297,38601,1826.775972,False,0.0,deepseek-ai/DeepSeek-V3.1,reverse-engineering,1826.775972,False,0.2,False,1826.775972 +270204a5-fa6b-42a4-b9cf-cd7843a286fa,moonshotai/Kimi-K2-Instruct-0905,together_ai,write-compressor,12996,13564,26560,900.032755,False,0.0,moonshotai/Kimi-K2-Instruct-0905,write-compressor,900.032755,False,0.0,False,900.032755 +1e1257c2-0bc8-4762-881e-cf7fab034b48,claude-sonnet-4-20250514,anthropic,break-filter-js-from-html,10543,10217,20760,1220.919695,False,0.0,claude-sonnet-4-20250514,break-filter-js-from-html,1220.919695,False,0.0,False,1220.919695 +f77a0798-df34-4780-9760-8a0e9238c37b,moonshotai/Kimi-K2-Instruct-0905,together_ai,dna-assembly,11512,7245,18757,744.495063,False,0.0,moonshotai/Kimi-K2-Instruct-0905,dna-assembly,744.495063,False,0.0,False,744.495063 +5118648f-de26-4aff-8431-44add62f6a71,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,write-compressor,5298,5121,10419,357.40933,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,write-compressor,357.40933,False,0.0,False,357.40933 +2add1490-1465-49a4-bafc-b9b1c19f266b,OpenAI/gpt-oss-20B,together_ai,crack-7z-hash,1101,360,1461,12.386415,False,0.0,OpenAI/gpt-oss-20B,crack-7z-hash,12.386415,False,0.0,False,12.386415 
+bbbcde4e-4818-4fdd-b157-8308131ad128,claude-opus-4-1-20250805,anthropic,model-extraction-relu-logits,3777,2641,6418,584.547492,False,0.0,claude-opus-4-1-20250805,model-extraction-relu-logits,584.547492,False,0.0,False,584.547492 +d3d2d894-f879-4c43-93bc-6304b67ee4c5,deepseek-ai/DeepSeek-V3.1,together_ai,cobol-modernization,5153,3293,8446,915.780992,True,1.0,deepseek-ai/DeepSeek-V3.1,cobol-modernization,915.780992,True,0.6,True,915.780992 +0167e4f1-558a-499f-b095-933391437034,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,password-recovery,5334,5006,10340,910.24323,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,password-recovery,910.24323,False,0.2,False,910.24323 +e18682a6-1072-4f7f-9fda-a91471928efb,grok-4-0709,xai,path-tracing,10245,3711,13956,1800.08514,False,0.0,grok-4-0709,path-tracing,1800.08514,False,0.0,False,1800.08514 +b7bfafc2-a9ba-4789-bc08-8fca0843559d,deepseek-ai/DeepSeek-V3.1,together_ai,wasm-pipeline,4491,5774,10265,661.050241,True,1.0,deepseek-ai/DeepSeek-V3.1,wasm-pipeline,661.050241,True,0.4,True,661.050241 +a49fb737-4705-462a-96f3-1544614fa7cc,OpenAI/gpt-oss-20B,together_ai,fix-code-vulnerability,2805,8787,11592,900.024056,False,0.0,OpenAI/gpt-oss-20B,fix-code-vulnerability,900.024056,False,0.0,False,900.024056 +52b8dfa7-4997-40ee-b92b-18d6dea22fdc,gpt-5,openai,sqlite-with-gcov,4578,1347,5925,334.186121,True,1.0,gpt-5,sqlite-with-gcov,334.186121,True,0.3333333333333333,True,334.186121 +647be2a0-189c-4619-bb02-51c65e5199bd,claude-opus-4-1-20250805,anthropic,financial-document-processor,8986,2988,11974,318.867634,False,0.0,claude-opus-4-1-20250805,financial-document-processor,318.867634,False,0.0,False,318.867634 +e075940b-9c24-46d5-9b9c-959893b67c63,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,path-tracing,3118,2745,5863,450.005837,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,path-tracing,450.005837,False,0.0,False,450.005837 
+3bd06a7a-8261-4383-a026-279a27170652,zai-org/GLM-4.5-Air-FP8,together_ai,nginx-request-logging,5087,3895,8982,580.678413,True,1.0,zai-org/GLM-4.5-Air-FP8,nginx-request-logging,580.678413,True,1.0,True,580.678413 +3f097312-f313-44f8-a08e-d0b3be32473b,OpenAI/gpt-oss-20B,together_ai,feal-differential-cryptanalysis,1565,4018,5583,180.345809,False,0.0,OpenAI/gpt-oss-20B,feal-differential-cryptanalysis,180.345809,False,0.0,False,180.345809 +5d8b5329-94db-490f-9f86-9e4965f82d75,zai-org/GLM-4.5-Air-FP8,together_ai,count-dataset-tokens,9859,3726,13585,246.060796,False,0.0,zai-org/GLM-4.5-Air-FP8,count-dataset-tokens,246.060796,False,0.0,False,246.060796 +dddf66b4-b8fa-4885-a243-af8664b6dba6,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,make-mips-interpreter,21280,13022,34302,1350.749868,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,make-mips-interpreter,1350.749868,False,0.0,False,1350.749868 +092edccd-2bd3-4795-9f3b-33370ee33590,grok-code-fast-1,xai,model-extraction-relu-logits,1297,569,1866,79.757427,False,0.0,grok-code-fast-1,model-extraction-relu-logits,79.757427,False,0.0,False,79.757427 +ebbfbed3-c4d8-4a8f-8a9c-ecf733f3dc47,OpenAI/gpt-oss-20B,together_ai,distribution-search,214,2439,2653,134.236845,False,0.0,OpenAI/gpt-oss-20B,distribution-search,134.236845,False,0.0,False,134.236845 +b75991f1-a1a4-49b8-a79d-fda46a16dd79,gpt-5,openai,bn-fit-modify,9680,10749,20429,893.268747,True,1.0,gpt-5,bn-fit-modify,893.268747,True,0.5,True,893.268747 +924eeac1-571a-4f91-b076-8f7448c6cc8e,openai/gpt-oss-120b,together_ai,sqlite-db-truncate,2811,3037,5848,902.514742,False,0.0,openai/gpt-oss-120b,sqlite-db-truncate,902.514742,False,0.0,False,902.514742 +92836f0d-83b3-4aa7-ade3-4b3a007e7174,deepseek-ai/DeepSeek-V3.1,together_ai,pytorch-model-recovery,7766,4053,11819,176.558374,True,1.0,deepseek-ai/DeepSeek-V3.1,pytorch-model-recovery,176.558374,True,0.6,True,176.558374 
+9cf8b8a1-8103-43ff-9678-b5f38e2f9192,claude-opus-4-1-20250805,anthropic,merge-diff-arc-agi-task,10506,4676,15182,905.644947,False,0.0,claude-opus-4-1-20250805,merge-diff-arc-agi-task,905.644947,False,0.3333333333333333,False,905.644947 +0a58d159-718f-4974-abec-71ffa805d259,gemini-2.5-pro,gemini,torch-tensor-parallelism,2077,1856,3933,131.577036,False,0.0,gemini-2.5-pro,torch-tensor-parallelism,131.577036,False,0.0,False,131.577036 +cc328a2b-99c8-495c-9e9d-7b068f72e158,claude-sonnet-4-20250514,anthropic,mteb-retrieve,2579,1899,4478,232.474923,False,0.0,claude-sonnet-4-20250514,mteb-retrieve,232.474923,False,0.0,False,232.474923 +1e29b6ac-8a25-440a-9514-d027b295442b,gpt-5,openai,pytorch-model-recovery,12156,12854,25010,900.003088,False,0.0,gpt-5,pytorch-model-recovery,900.003088,False,0.4285714285714285,False,900.003088 +7bd97228-02ee-4869-96a4-158daa667939,gpt-5-mini,openai,filter-js-from-html,3692,2731,6423,286.460354,False,0.0,gpt-5-mini,filter-js-from-html,286.460354,False,0.0,False,286.460354 +d7af7174-d4be-4866-9e6e-959bfaedf1b8,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,qemu-alpine-ssh,4597,5393,9990,916.920913,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,qemu-alpine-ssh,916.920913,False,0.2,False,916.920913 +86ae226e-e887-4b5e-8180-749d1d2bfc54,OpenAI/gpt-oss-20B,together_ai,filter-js-from-html,1506,879,2385,12.630612,False,0.0,OpenAI/gpt-oss-20B,filter-js-from-html,12.630612,False,0.0,False,12.630612 +9a199c5d-afac-411f-a125-81d884303cc8,gemini-2.5-pro,gemini,pytorch-model-cli,3827,3438,7265,359.02534,False,0.0,gemini-2.5-pro,pytorch-model-cli,359.02534,False,0.4,False,359.02534 +f8b7fbb3-a2fc-4501-b10d-38fb307a3fc5,grok-4-0709,xai,path-tracing-reverse,6513,9605,16118,1832.513526,False,0.0,grok-4-0709,path-tracing-reverse,1832.513526,False,0.0,False,1832.513526 
+1dfcc15f-dbef-4f83-b13f-e6b695ff212a,zai-org/GLM-4.5-Air-FP8,together_ai,large-scale-text-editing,8230,9298,17528,1212.510062,False,0.0,zai-org/GLM-4.5-Air-FP8,large-scale-text-editing,1212.510062,False,0.0,False,1212.510062 +ac7092e1-59c8-4211-a7e5-0f0068280fc1,claude-sonnet-4-20250514,anthropic,count-dataset-tokens,12229,4558,16787,326.745536,False,0.0,claude-sonnet-4-20250514,count-dataset-tokens,326.745536,False,0.0,False,326.745536 +e6aec74e-ef43-4284-aaab-941e2deb72a0,grok-4-0709,xai,sparql-university,4907,1194,6101,399.804394,False,0.0,grok-4-0709,sparql-university,399.804394,False,0.4,False,399.804394 +daf4b291-5ba1-4ed3-9636-cb7dccfda898,gpt-5-mini,openai,build-pmars,4524,2793,7317,2063.485858,False,0.0,gpt-5-mini,build-pmars,2063.485858,False,0.2,False,2063.485858 +3d7bd1b7-12e7-4b8f-b0ab-1977776a81e2,claude-sonnet-4-20250514,anthropic,fix-git,3661,2290,5951,184.343923,True,1.0,claude-sonnet-4-20250514,fix-git,184.343923,True,1.0,True,184.343923 +61985c81-214f-4a68-a27b-4a43a3fbb78e,gpt-5-mini,openai,build-initramfs-qemu,2011,2361,4372,135.585142,False,0.0,gpt-5-mini,build-initramfs-qemu,135.585142,False,0.0,False,135.585142 +28a0e44b-064b-4fb5-a137-3d2f86c548f6,gpt-5,openai,torch-tensor-parallelism,2646,3677,6323,513.068155,False,0.0,gpt-5,torch-tensor-parallelism,513.068155,False,0.0,False,513.068155 +84aa6535-9a4f-4791-aae2-b69f5a20c1fb,claude-sonnet-4-20250514,anthropic,password-recovery,5389,6868,12257,574.155521,False,0.0,claude-sonnet-4-20250514,password-recovery,574.155521,False,0.4,False,574.155521 +2126039e-fb03-4bdc-b5fb-bb77d6cbfe77,zai-org/GLM-4.5-Air-FP8,together_ai,winning-avg-corewars,4382,4872,9254,372.466426,False,0.0,zai-org/GLM-4.5-Air-FP8,winning-avg-corewars,372.466426,False,0.0,False,372.466426 +0e13e697-d4f5-4793-a157-a6aa3222e48a,claude-opus-4-1-20250805,anthropic,db-wal-recovery,7458,5903,13361,876.161393,False,0.0,claude-opus-4-1-20250805,db-wal-recovery,876.161393,False,0.0,False,876.161393 
+5983b664-fe7c-49f3-9448-b5fa5545a56d,zai-org/GLM-4.5-Air-FP8,together_ai,make-mips-interpreter,19599,31233,50832,1802.970575,False,0.0,zai-org/GLM-4.5-Air-FP8,make-mips-interpreter,1802.970575,False,0.0,False,1802.970575 +2ea574ab-99de-4328-b1f0-1ab5cfb797fb,gpt-5-mini,openai,qemu-alpine-ssh,2325,2924,5249,401.584648,False,0.0,gpt-5-mini,qemu-alpine-ssh,401.584648,False,0.0,False,401.584648 +2db5ef23-ba6a-4401-bad6-0c2633e8ba49,gemini-2.5-pro,gemini,hf-model-inference,6559,2271,8830,900.775896,True,1.0,gemini-2.5-pro,hf-model-inference,900.775896,True,0.8,True,900.775896 +5c7e79ec-3666-4fdc-8728-a8deed40d238,gemini-2.5-pro,gemini,install-windows-3.11,6551,3019,9570,530.952951,False,0.0,gemini-2.5-pro,install-windows-3.11,530.952951,False,0.0,False,530.952951 +b6f560d3-deaa-4f3a-b992-31d217167d50,gpt-5-nano,openai,feal-linear-cryptanalysis,6140,21308,27448,1801.367497,False,0.0,gpt-5-nano,feal-linear-cryptanalysis,1801.367497,False,0.0,False,1801.367497 +ab82794a-3124-4596-bd81-d6fa1747519a,moonshotai/Kimi-K2-Instruct-0905,together_ai,pytorch-model-cli,8311,8599,16910,839.393672,False,0.0,moonshotai/Kimi-K2-Instruct-0905,pytorch-model-cli,839.393672,False,0.0,False,839.393672 +c54620ba-5fde-47c0-a0d0-707b57e59589,moonshotai/Kimi-K2-Instruct-0905,together_ai,distribution-search,23272,18810,42082,1642.710512,False,0.0,moonshotai/Kimi-K2-Instruct-0905,distribution-search,1642.710512,False,0.2,False,1642.710512 +087e039f-7892-4f40-b99d-d15963c6294d,zai-org/GLM-4.5-Air-FP8,together_ai,pytorch-model-cli,5633,12703,18336,901.222718,False,0.0,zai-org/GLM-4.5-Air-FP8,pytorch-model-cli,901.222718,False,0.0,False,901.222718 +3110eea4-e036-4e60-be14-5a47c5b6d9ab,grok-4-0709,xai,qemu-startup,7050,5059,12109,904.662798,False,0.0,grok-4-0709,qemu-startup,904.662798,False,0.4,False,904.662798 
+86576d8c-6f2f-4603-8c6d-093454315e86,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,log-summary-date-ranges,5110,2251,7361,172.084493,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,log-summary-date-ranges,172.084493,False,0.0,False,172.084493 +4742659e-e25f-4c30-9da9-928a55c4abe5,claude-opus-4-1-20250805,anthropic,make-mips-interpreter,29701,23098,52799,2074.425933,False,0.0,claude-opus-4-1-20250805,make-mips-interpreter,2074.425933,False,0.0,False,2074.425933 +a5e689c1-171d-413d-8c92-bef40f6ae730,gpt-5-nano,openai,fix-git,10070,9258,19328,900.491035,False,0.0,gpt-5-nano,fix-git,900.491035,False,0.0,False,900.491035 +1f55ccc5-6b4a-405b-88eb-cd12d07484a6,gemini-2.5-flash,gemini,chess-best-move,10755,7611,18366,653.378282,False,0.0,gemini-2.5-flash,chess-best-move,653.378282,False,0.0,False,653.378282 +e0bff138-ed86-4280-af1f-9878992d0fd8,gpt-5-nano,openai,distribution-search,24584,29977,54561,3346.798907,False,0.0,gpt-5-nano,distribution-search,3346.798907,False,0.25,False,3346.798907 +517a614e-0f82-4994-9e44-f556732196a1,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,form-filling,9987,7411,17398,374.51275,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,form-filling,374.51275,True,0.8,True,374.51275 +03b30e27-1968-47c1-a5ab-5a79f4ed2070,OpenAI/gpt-oss-20B,together_ai,path-tracing,7202,27717,34919,1800.565119,False,0.0,OpenAI/gpt-oss-20B,path-tracing,1800.565119,False,0.0,False,1800.565119 +09096bf7-c0db-47c7-ac0c-956e1ed86948,gemini-2.5-flash,gemini,dna-assembly,12244,2552,14796,759.453596,False,0.0,gemini-2.5-flash,dna-assembly,759.453596,False,0.0,False,759.453596 +f1f8230d-cf05-4c87-b67a-b9ffe6236233,gpt-5,openai,merge-diff-arc-agi-task,9271,5889,15160,502.368781,True,1.0,gpt-5,merge-diff-arc-agi-task,502.368781,True,1.0,True,502.368781 
+c329d066-2cdf-4f52-af72-b07fb06f3e3a,moonshotai/Kimi-K2-Instruct-0905,together_ai,filter-js-from-html,3593,2925,6518,579.247683,False,0.0,moonshotai/Kimi-K2-Instruct-0905,filter-js-from-html,579.247683,False,0.0,False,579.247683 +f99b4129-b499-4886-9549-d2951d24dc7b,deepseek-ai/DeepSeek-V3.1,together_ai,sparql-university,6715,2221,8936,721.252193,False,0.0,deepseek-ai/DeepSeek-V3.1,sparql-university,721.252193,False,0.0,False,721.252193 +4ec8a64f-1f87-4482-b9d3-044b2fb5b984,gemini-2.5-flash,gemini,tune-mjcf,4958,5064,10022,471.552013,True,1.0,gemini-2.5-flash,tune-mjcf,471.552013,True,0.6,True,471.552013 +bb446a9f-a960-4737-b8d6-6728783efad9,gemini-2.5-flash,gemini,merge-diff-arc-agi-task,7860,5215,13075,912.572668,False,0.0,gemini-2.5-flash,merge-diff-arc-agi-task,912.572668,False,0.0,False,912.572668 +29bb5dda-d5ab-4de6-bda7-8c5f7fc74c9a,claude-opus-4-1-20250805,anthropic,mteb-retrieve,2519,1606,4125,208.507572,False,0.0,claude-opus-4-1-20250805,mteb-retrieve,208.507572,False,0.0,False,208.507572 +0a0351d6-8b38-4172-a848-ae94a42cf371,grok-4-0709,xai,fix-git,1948,1560,3508,154.096906,True,1.0,grok-4-0709,fix-git,154.096906,True,1.0,True,154.096906 +ef762438-6043-4a42-a45a-b9b481840ac6,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,port-compressor,40415,20157,60572,3600.471402,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,port-compressor,3600.471402,False,0.0,False,3600.471402 +f929d823-dee6-409e-9db1-d405031e0364,claude-sonnet-4-20250514,anthropic,train-fasttext,15776,4945,20721,1564.457289,False,0.0,claude-sonnet-4-20250514,train-fasttext,1564.457289,False,0.0,False,1564.457289 +0e5258c5-aa4f-43d2-bb3c-8e7fa1764fa6,grok-code-fast-1,xai,make-mips-interpreter,5446,17346,22792,1153.781232,False,0.0,grok-code-fast-1,make-mips-interpreter,1153.781232,False,0.0,False,1153.781232 
+49e34070-2538-4290-b4f8-e0d41b4cf5bf,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,model-extraction-relu-logits,3384,4097,7481,1150.099171,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,model-extraction-relu-logits,1150.099171,False,0.0,False,1150.099171 +a5086497-24b6-4f1f-89f3-f685ebfdb916,deepseek-ai/DeepSeek-V3.1,together_ai,vulnerable-secret,1303,1248,2551,900.017554,False,0.0,deepseek-ai/DeepSeek-V3.1,vulnerable-secret,900.017554,False,0.4,False,900.017554 +24e5a5c8-a6fb-4a4d-a194-bcdc461d7e94,moonshotai/Kimi-K2-Instruct-0905,together_ai,break-filter-js-from-html,8225,9468,17693,1200.199585,False,0.0,moonshotai/Kimi-K2-Instruct-0905,break-filter-js-from-html,1200.199585,False,0.0,False,1200.199585 +58f64bdf-97eb-4227-91c2-31198d5cfe9d,OpenAI/gpt-oss-20B,together_ai,nginx-request-logging,1216,1713,2929,235.40418,False,0.0,OpenAI/gpt-oss-20B,nginx-request-logging,235.40418,False,0.0,False,235.40418 +0ea087ae-f546-49b5-b4ba-465a75adabe4,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sanitize-git-repo,2998,1444,4442,205.627928,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sanitize-git-repo,205.627928,False,0.0,False,205.627928 +362279f4-044f-4901-89ba-2da02544265a,gpt-5,openai,largest-eigenval,8329,7888,16217,913.914877,False,0.0,gpt-5,largest-eigenval,913.914877,False,0.0,False,913.914877 +c348ce81-3e52-4f5d-a78e-a9afecac119f,gpt-5-nano,openai,path-tracing-reverse,23751,19794,43545,1835.192355,False,0.0,gpt-5-nano,path-tracing-reverse,1835.192355,False,0.0,False,1835.192355 +4fcdd852-4c82-4729-b5cc-7762b7e288dc,claude-opus-4-1-20250805,anthropic,adaptive-rejection-sampler,12472,10407,22879,901.03392,False,0.0,claude-opus-4-1-20250805,adaptive-rejection-sampler,901.03392,False,0.125,False,901.03392 +4f557590-e84d-4199-82cb-3e8532328147,gpt-5-nano,openai,cancel-async-tasks,4675,4086,8761,664.885121,False,0.0,gpt-5-nano,cancel-async-tasks,664.885121,False,0.4,False,664.885121 
+fde3398d-cc4c-414e-9a9d-6305304b8886,claude-opus-4-1-20250805,anthropic,code-from-image,37245,33900,71145,1200.002843,False,0.0,claude-opus-4-1-20250805,code-from-image,1200.002843,False,0.125,False,1200.002843 +81a5c951-9163-418e-b7d2-b1735d14a57a,deepseek-ai/DeepSeek-V3.1,together_ai,adaptive-rejection-sampler,13303,11716,25019,901.072124,False,0.0,deepseek-ai/DeepSeek-V3.1,adaptive-rejection-sampler,901.072124,False,0.2,False,901.072124 +b57d4fc9-d8d5-43d0-9d20-488b6ceff5c5,moonshotai/Kimi-K2-Instruct-0905,together_ai,configure-git-webserver,7859,4368,12227,592.978233,True,1.0,moonshotai/Kimi-K2-Instruct-0905,configure-git-webserver,592.978233,True,0.6,True,592.978233 +5a60ec64-138d-4db9-baaf-0ea2af61f9b3,gpt-5,openai,openssl-selfsigned-cert,2476,1346,3822,121.959776,True,1.0,gpt-5,openssl-selfsigned-cert,121.959776,True,1.0,True,121.959776 +8891dd1c-48f2-4c4c-ad0a-011b8107999d,OpenAI/gpt-oss-20B,together_ai,filter-js-from-html,1436,842,2278,30.840991,False,0.0,OpenAI/gpt-oss-20B,filter-js-from-html,30.840991,False,0.0,False,30.840991 +9ff8ef43-236f-4611-9c9d-28df1836433b,gemini-2.5-pro,gemini,qemu-startup,1260,1012,2272,106.833497,False,0.0,gemini-2.5-pro,qemu-startup,106.833497,False,0.2,False,106.833497 +0918ce2f-0772-4f77-95d3-0bc08cc319d1,moonshotai/Kimi-K2-Instruct-0905,together_ai,reshard-c4-data,9735,5741,15476,1786.932415,False,0.0,moonshotai/Kimi-K2-Instruct-0905,reshard-c4-data,1786.932415,False,0.0,False,1786.932415 +3e3dcfef-6336-46bd-ace0-0cc25bb10e8a,claude-opus-4-1-20250805,anthropic,tune-mjcf,16814,14846,31660,1008.545189,False,0.0,claude-opus-4-1-20250805,tune-mjcf,1008.545189,False,0.25,False,1008.545189 +f8061f3b-ea90-4563-99ec-cfffe1e2ecbb,gpt-5,openai,path-tracing-reverse,15024,15017,30041,1860.210053,False,0.0,gpt-5,path-tracing-reverse,1860.210053,False,0.0,False,1860.210053 
+bddd6888-8633-4b27-aa57-3a331a7ff544,claude-opus-4-1-20250805,anthropic,write-compressor,12952,11196,24148,931.172761,False,0.0,claude-opus-4-1-20250805,write-compressor,931.172761,False,0.0,False,931.172761 +48de3f9d-ad90-4ce2-9e83-49b9fa08e635,gemini-2.5-flash,gemini,git-leak-recovery,1697,1944,3641,127.800433,False,0.0,gemini-2.5-flash,git-leak-recovery,127.800433,False,0.6,False,127.800433 +b16bec4f-7de1-4ee8-a6a0-1b6fd638b1dc,gemini-2.5-flash,gemini,winning-avg-corewars,13097,17612,30709,952.083953,False,0.0,gemini-2.5-flash,winning-avg-corewars,952.083953,False,0.0,False,952.083953 +9002e43e-163d-4f5b-aaf8-b199d55abd51,claude-sonnet-4-20250514,anthropic,tune-mjcf,13783,13351,27134,949.742623,False,0.0,claude-sonnet-4-20250514,tune-mjcf,949.742623,False,0.2,False,949.742623 +b5c07074-3df7-4b5d-ad8b-e16c1d69fe88,claude-opus-4-1-20250805,anthropic,build-cython-ext,13082,3867,16949,1106.463119,False,0.0,claude-opus-4-1-20250805,build-cython-ext,1106.463119,False,0.0,False,1106.463119 +3284c740-abed-4169-ba43-543fd7b71ec3,gemini-2.5-flash,gemini,sparql-university,6587,2199,8786,142.54112,False,0.0,gemini-2.5-flash,sparql-university,142.54112,False,0.0,False,142.54112 +938c8306-ea85-4b48-9a8f-13ffd6299616,moonshotai/Kimi-K2-Instruct-0905,together_ai,vulnerable-secret,10554,10575,21129,904.684933,False,0.0,moonshotai/Kimi-K2-Instruct-0905,vulnerable-secret,904.684933,False,0.2,False,904.684933 +4e9beb73-864a-45bd-91ab-fd5dbfce7627,gpt-5-nano,openai,tune-mjcf,6244,7936,14180,928.837663,False,0.0,gpt-5-nano,tune-mjcf,928.837663,False,0.0,False,928.837663 +447fa237-a571-4077-875a-0e06463593ca,OpenAI/gpt-oss-20B,together_ai,vulnerable-secret,414,1366,1780,154.991213,False,0.0,OpenAI/gpt-oss-20B,vulnerable-secret,154.991213,False,0.0,False,154.991213 +91d7ff78-9e8b-4bb6-be03-77ba1f88d54d,gemini-2.5-flash,gemini,model-extraction-relu-logits,4358,3952,8310,579.314233,False,0.0,gemini-2.5-flash,model-extraction-relu-logits,579.314233,False,0.2,False,579.314233 
+c1c87db3-b5f9-47fe-9734-89478e1cbdd4,OpenAI/gpt-oss-20B,together_ai,nginx-request-logging,3711,1430,5141,87.401822,False,0.0,OpenAI/gpt-oss-20B,nginx-request-logging,87.401822,False,0.0,False,87.401822 +26388b9d-64e7-42c8-989d-79d21c95e205,gemini-2.5-pro,gemini,write-compressor,1537,706,2243,1454.964977,False,0.0,gemini-2.5-pro,write-compressor,1454.964977,False,0.0,False,1454.964977 +b7ecbc3c-5b5c-4eef-b2c2-ec3a3814483a,claude-opus-4-1-20250805,anthropic,distribution-search,15382,13927,29309,896.313803,True,1.0,claude-opus-4-1-20250805,distribution-search,896.313803,True,0.5555555555555556,True,896.313803 +f69f4d15-4421-4a0f-8f73-2008d632673f,OpenAI/gpt-oss-20B,together_ai,build-cython-ext,84,214,298,908.079582,False,0.0,OpenAI/gpt-oss-20B,build-cython-ext,908.079582,False,0.0,False,908.079582 +5a7417fe-a88b-42d5-b6a5-7b01d32763c6,gpt-5,openai,form-filling,12684,17213,29897,665.346979,True,1.0,gpt-5,form-filling,665.346979,True,0.8,True,665.346979 +3503a565-bbc9-4a0f-a91e-1b71c23dfb4d,grok-4-0709,xai,circuit-fibsqrt,4031,2181,6212,3605.816061,False,0.0,grok-4-0709,circuit-fibsqrt,3605.816061,False,0.0,False,3605.816061 +03e75e83-d09e-4936-a970-f869509dae21,grok-code-fast-1,xai,git-leak-recovery,1177,535,1712,77.518181,False,0.0,grok-code-fast-1,git-leak-recovery,77.518181,False,0.2,False,77.518181 +4f48eaee-cc2e-4f71-9624-fefc9da2945a,grok-code-fast-1,xai,crack-7z-hash,13873,2677,16550,657.528846,True,1.0,grok-code-fast-1,crack-7z-hash,657.528846,True,0.6,True,657.528846 +c69c8afe-4980-46eb-a46d-13aefce461a8,gpt-5-nano,openai,fix-ocaml-gc,17334,8306,25640,3602.946318,False,0.0,gpt-5-nano,fix-ocaml-gc,3602.946318,False,0.0,False,3602.946318 +00b3868a-38bf-42c8-bb15-d45f22f48f65,claude-sonnet-4-20250514,anthropic,crack-7z-hash,5816,3897,9713,411.545471,True,1.0,claude-sonnet-4-20250514,crack-7z-hash,411.545471,True,1.0,True,411.545471 
+49d38b2b-5e4b-4efe-9838-67ac611ec8b5,zai-org/GLM-4.5-Air-FP8,together_ai,sanitize-git-repo,13505,4397,17902,496.186615,False,0.0,zai-org/GLM-4.5-Air-FP8,sanitize-git-repo,496.186615,False,0.0,False,496.186615 +622fd5f6-741a-44db-9935-6008fcd31d34,gpt-5,openai,sqlite-with-gcov,5122,1911,7033,325.941034,False,0.0,gpt-5,sqlite-with-gcov,325.941034,False,0.3333333333333333,False,325.941034 +1fc05812-b820-4c06-9bb0-81b75658e7b7,gpt-5-mini,openai,polyglot-c-py,1596,1771,3367,390.116905,False,0.0,gpt-5-mini,polyglot-c-py,390.116905,False,0.0,False,390.116905 +438da45e-2138-499c-960b-37923d6859ab,moonshotai/Kimi-K2-Instruct-0905,together_ai,largest-eigenval,5467,4309,9776,908.713165,False,0.0,moonshotai/Kimi-K2-Instruct-0905,largest-eigenval,908.713165,False,0.2,False,908.713165 +3905f39f-c343-4047-81da-e09760ba7025,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,install-windows-3.11,6996,1480,8476,154.505019,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,install-windows-3.11,154.505019,False,0.0,False,154.505019 +bde404ca-0f41-43a6-b5ba-422c1815aa3b,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,install-klee-minimal,8449,2582,11031,900.013688,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,install-klee-minimal,900.013688,False,0.0,False,900.013688 +0a20299f-a983-4f70-bfc6-54084b805f60,openai/gpt-oss-120b,together_ai,largest-eigenval,9421,9334,18755,912.980275,False,0.0,openai/gpt-oss-120b,largest-eigenval,912.980275,False,0.0,False,912.980275 +189c55ce-6e82-4ee6-bd1e-0e4e43e39794,moonshotai/Kimi-K2-Instruct-0905,together_ai,write-compressor,9250,11019,20269,900.378559,False,0.0,moonshotai/Kimi-K2-Instruct-0905,write-compressor,900.378559,False,0.0,False,900.378559 +d4bd0d04-9a65-4d12-bbc1-3a5d52b9f3f5,gpt-5,openai,regex-log,1648,1575,3223,217.944763,True,1.0,gpt-5,regex-log,217.944763,True,1.0,True,217.944763 
+55cda5ed-9883-4b5c-8579-f555e695fe89,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,gpt2-codegolf,11732,12642,24374,904.096074,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,gpt2-codegolf,904.096074,False,0.0,False,904.096074 +9a54e3a4-4fe9-4c19-baf8-624080d4157d,grok-4-0709,xai,count-dataset-tokens,11139,2852,13991,910.963149,False,0.0,grok-4-0709,count-dataset-tokens,910.963149,False,0.0,False,910.963149 +c93402dc-192f-498c-8db8-247f1b3249cf,grok-4-0709,xai,large-scale-text-editing,2116,1614,3730,1200.487176,False,0.0,grok-4-0709,large-scale-text-editing,1200.487176,False,0.4,False,1200.487176 +cad37194-b58f-458f-a779-5f3b984bc7fb,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-pov-ray,20054,8289,28343,1779.940368,True,1.0,moonshotai/Kimi-K2-Instruct-0905,build-pov-ray,1779.940368,True,1.0,True,1779.940368 +562ac434-8192-4567-ba00-414ee15d82b0,moonshotai/Kimi-K2-Instruct-0905,together_ai,path-tracing-reverse,8559,8765,17324,737.642621,False,0.0,moonshotai/Kimi-K2-Instruct-0905,path-tracing-reverse,737.642621,False,0.0,False,737.642621 +4623c750-29fe-439d-9da3-5e054c4f4487,gpt-5-nano,openai,large-scale-text-editing,10557,10051,20608,1219.124585,False,0.0,gpt-5-nano,large-scale-text-editing,1219.124585,False,0.0,False,1219.124585 +9287adce-e437-43a9-a80a-7024048aff5a,gpt-5-mini,openai,crack-7z-hash,9434,5136,14570,544.50342,False,0.0,gpt-5-mini,crack-7z-hash,544.50342,False,0.0,False,544.50342 +2c31ca6e-d20f-47f7-bb24-b24ba694b441,gpt-5,openai,break-filter-js-from-html,2691,1500,4191,221.7925,False,0.0,gpt-5,break-filter-js-from-html,221.7925,False,0.4285714285714285,False,221.7925 +2b942958-a411-4a13-bdec-767ced7a9a7f,gemini-2.5-flash,gemini,path-tracing-reverse,8386,24435,32821,1800.932954,False,0.0,gemini-2.5-flash,path-tracing-reverse,1800.932954,False,0.0,False,1800.932954 +967301e6-a3da-4932-97db-329020ce7f6e,grok-code-fast-1,xai,fix-git,2342,2268,4610,260.749011,True,1.0,grok-code-fast-1,fix-git,260.749011,True,0.2,True,260.749011 
+b2860e8f-0ee3-42b2-af10-ad425d7d089b,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,prove-plus-comm,1321,1182,2503,80.412506,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,prove-plus-comm,80.412506,False,0.0,False,80.412506 +41dfa544-50cf-4458-9542-a52b6c78115b,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,financial-document-processor,8803,3563,12366,216.610444,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,financial-document-processor,216.610444,False,0.0,False,216.610444 +fb4b0c44-d06d-4c8b-94af-ca6f8836f660,gpt-5,openai,crack-7z-hash,2432,2240,4672,900.001286,False,0.0,gpt-5,crack-7z-hash,900.001286,False,0.4285714285714285,False,900.001286 +9df4c247-fed5-4d32-b2c2-9e6bdc72a573,gpt-5,openai,winning-avg-corewars,10774,8940,19714,974.993514,True,1.0,gpt-5,winning-avg-corewars,974.993514,True,0.2857142857142857,True,974.993514 +ce28af1d-f127-4f80-81ee-c5d53ff81b0a,gemini-2.5-pro,gemini,write-compressor,12319,9711,22030,930.475917,False,0.0,gemini-2.5-pro,write-compressor,930.475917,False,0.0,False,930.475917 +bced4c14-26c3-4a76-a701-2a0668122540,grok-code-fast-1,xai,build-pov-ray,1457,1184,2641,188.477947,False,0.0,grok-code-fast-1,build-pov-ray,188.477947,False,0.2,False,188.477947 +1458a7c2-1249-4032-a516-3e4598c1a0e3,deepseek-ai/DeepSeek-V3.1,together_ai,build-pmars,11576,2436,14012,236.012856,True,1.0,deepseek-ai/DeepSeek-V3.1,build-pmars,236.012856,True,1.0,True,236.012856 +06f54a6d-e2e8-4543-aefa-23f6f8aa2259,grok-4-0709,xai,largest-eigenval,8238,4177,12415,900.051819,False,0.0,grok-4-0709,largest-eigenval,900.051819,False,0.0,False,900.051819 +938d6b2d-b5c7-404f-92ce-5226f75754c8,grok-code-fast-1,xai,db-wal-recovery,2187,2533,4720,122.183828,False,0.0,grok-code-fast-1,db-wal-recovery,122.183828,False,0.0,False,122.183828 +e5ded101-a798-460f-94f9-cb01ac5cc0f3,claude-sonnet-4-20250514,anthropic,qemu-alpine-ssh,2166,3414,5580,551.596622,False,0.0,claude-sonnet-4-20250514,qemu-alpine-ssh,551.596622,False,0.6,False,551.596622 
+3571d2e4-6aa9-4289-bf01-10cc763e75e9,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-initramfs-qemu,3213,3451,6664,328.104842,False,0.0,moonshotai/Kimi-K2-Instruct-0905,build-initramfs-qemu,328.104842,False,0.0,False,328.104842 +becd73ba-978c-4b84-874f-e2679e017d1a,grok-4-0709,xai,db-wal-recovery,3641,3189,6830,914.233676,False,0.0,grok-4-0709,db-wal-recovery,914.233676,False,0.2,False,914.233676 +5b16a7e3-80c6-4b7a-be8a-d47f977c7ce0,claude-opus-4-1-20250805,anthropic,log-summary-date-ranges,6917,1517,8434,109.058518,True,1.0,claude-opus-4-1-20250805,log-summary-date-ranges,109.058518,True,0.8888888888888888,True,109.058518 +9a82236c-73aa-4933-9072-6170ec8f32ab,OpenAI/gpt-oss-20B,together_ai,install-klee-minimal,1565,1374,2939,472.458872,False,0.0,OpenAI/gpt-oss-20B,install-klee-minimal,472.458872,False,0.0,False,472.458872 +2de1ebb3-c9f1-44a3-81b1-5b374965db82,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,configure-git-webserver,7530,3445,10975,668.713229,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,configure-git-webserver,668.713229,True,0.6,True,668.713229 +6423921b-b1f5-43f0-a5d2-1f12b805a9dd,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,hf-model-inference,8670,4147,12817,334.198409,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,hf-model-inference,334.198409,False,0.0,False,334.198409 +e251ab03-2b20-48d3-8c5f-8ca18e6de1a8,moonshotai/Kimi-K2-Instruct-0905,together_ai,reshard-c4-data,7938,5578,13516,448.617127,False,0.0,moonshotai/Kimi-K2-Instruct-0905,reshard-c4-data,448.617127,False,0.0,False,448.617127 +6a76852c-afc2-46be-9bbd-cac5c6e07fdd,gemini-2.5-flash,gemini,polyglot-c-py,5363,6404,11767,900.039161,False,0.0,gemini-2.5-flash,polyglot-c-py,900.039161,False,0.0,False,900.039161 +a72f974b-b3d7-4dab-b976-6195c30a5d43,claude-sonnet-4-20250514,anthropic,extract-elf,6151,3524,9675,324.353545,False,0.0,claude-sonnet-4-20250514,extract-elf,324.353545,False,0.2,False,324.353545 
+21342448-ee8a-43a7-b5e1-ed20b3eb879a,grok-4-0709,xai,prove-plus-comm,1881,1384,3265,464.475587,True,1.0,grok-4-0709,prove-plus-comm,464.475587,True,0.8,True,464.475587 +4dd404b1-9531-4591-bc85-7365e9d1cf32,gpt-5-nano,openai,install-windows-3.11,7401,7425,14826,3627.529185,False,0.0,gpt-5-nano,install-windows-3.11,3627.529185,False,0.0,False,3627.529185 +b901d937-656c-415e-a1cd-3580abbc9d8c,openai/gpt-oss-120b,together_ai,distribution-search,2061,2047,4108,105.243984,False,0.0,openai/gpt-oss-120b,distribution-search,105.243984,False,0.0,False,105.243984 +7b30fbc4-b009-40cd-8b17-bad7ff090b74,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,large-scale-text-editing,6955,6080,13035,1244.966098,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,large-scale-text-editing,1244.966098,False,0.0,False,1244.966098 +a58d9461-6cc5-4423-886a-a4bd539608a0,claude-opus-4-1-20250805,anthropic,cancel-async-tasks,3548,3026,6574,103.413376,False,0.0,claude-opus-4-1-20250805,cancel-async-tasks,103.413376,False,0.125,False,103.413376 +dfbb884a-fa7f-416a-8531-27b400316d35,gpt-5,openai,feal-differential-cryptanalysis,2942,1718,4660,428.680043,False,0.0,gpt-5,feal-differential-cryptanalysis,428.680043,False,0.0,False,428.680043 +1d6a1188-f00f-4522-a9c4-db252d7759b3,gpt-5,openai,fix-ocaml-gc,28957,34448,63405,3600.002266,False,0.0,gpt-5,fix-ocaml-gc,3600.002266,False,0.0,False,3600.002266 +e352fcac-0c21-40bc-a7ce-04c68b369378,gemini-2.5-pro,gemini,run-pdp11-code,10101,5815,15916,1016.359131,False,0.0,gemini-2.5-pro,run-pdp11-code,1016.359131,False,0.0,False,1016.359131 +9f08c12f-1a42-4314-976a-2168025736c3,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-pmars,17337,5054,22391,753.10938,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-pmars,753.10938,True,1.0,True,753.10938 +d879309a-4d8f-4aee-a7ae-f05d0f15b2c3,gpt-5,openai,cancel-async-tasks,1552,1080,2632,109.211802,False,0.0,gpt-5,cancel-async-tasks,109.211802,False,0.6,False,109.211802 
+f1c98275-ca46-489c-9643-8f4889df9e67,claude-opus-4-1-20250805,anthropic,winning-avg-corewars,49800,45035,94835,3600.148603,False,0.0,claude-opus-4-1-20250805,winning-avg-corewars,3600.148603,False,0.3333333333333333,False,3600.148603 +92666a36-d44e-4dad-9bab-d1f3563a4938,moonshotai/Kimi-K2-Instruct-0905,together_ai,chess-best-move,8584,9602,18186,773.527844,False,0.0,moonshotai/Kimi-K2-Instruct-0905,chess-best-move,773.527844,False,0.0,False,773.527844 +f9df8f65-4ad8-4f2a-9646-f3267652e4a9,zai-org/GLM-4.5-Air-FP8,together_ai,cancel-async-tasks,968,1275,2243,204.080652,False,0.0,zai-org/GLM-4.5-Air-FP8,cancel-async-tasks,204.080652,False,0.2,False,204.080652 +a3d50e87-de59-4380-864a-d6635e8262eb,gpt-5-nano,openai,circuit-fibsqrt,37660,40474,78134,3607.975236,False,0.0,gpt-5-nano,circuit-fibsqrt,3607.975236,False,0.0,False,3607.975236 +f1ce53fa-a70e-49db-9f18-837c764d047e,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,break-filter-js-from-html,6857,9721,16578,1249.662433,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,break-filter-js-from-html,1249.662433,False,0.0,False,1249.662433 +7d5a1b21-6d5a-493d-96f8-97570ba74cc2,gpt-5,openai,run-pdp11-code,3720,2829,6549,1003.639201,False,0.0,gpt-5,run-pdp11-code,1003.639201,False,0.0,False,1003.639201 +c9e5da16-613d-4f92-80f1-38029855cf5b,claude-sonnet-4-20250514,anthropic,run-pdp11-code,11134,7542,18676,625.90093,False,0.0,claude-sonnet-4-20250514,run-pdp11-code,625.90093,False,0.0,False,625.90093 +9ecda2b6-6eb7-4bf9-a9d8-a6a96685873d,grok-code-fast-1,xai,pypi-server,4312,1811,6123,220.468185,True,1.0,grok-code-fast-1,pypi-server,220.468185,True,0.8,True,220.468185 +cd1509f6-d2bd-4001-bb24-77d140667d78,gemini-2.5-flash,gemini,schemelike-metacircular-eval,18701,61244,79945,2424.79551,True,1.0,gemini-2.5-flash,schemelike-metacircular-eval,2424.79551,True,0.2,True,2424.79551 
+4fd8980d-e426-4a44-9874-36ec457c15f8,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,pytorch-model-recovery,12787,7032,19819,430.819549,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,pytorch-model-recovery,430.819549,True,0.8,True,430.819549 +e3d620b9-73cb-40d1-b0ba-495a6f98440a,grok-code-fast-1,xai,count-dataset-tokens,9842,3163,13005,525.354606,False,0.0,grok-code-fast-1,count-dataset-tokens,525.354606,False,0.0,False,525.354606 +394497fa-7998-425e-ba88-32f7cae9bafc,grok-code-fast-1,xai,nginx-request-logging,4245,5157,9402,349.288517,False,0.0,grok-code-fast-1,nginx-request-logging,349.288517,False,0.0,False,349.288517 +9dbca2e3-c4f5-48ff-9ed4-d824c252c2c1,gemini-2.5-pro,gemini,fix-git,3716,1886,5602,146.54887,True,1.0,gemini-2.5-pro,fix-git,146.54887,True,1.0,True,146.54887 +ee94edce-4024-4e57-928d-1bc20d4db412,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,count-dataset-tokens,8934,3320,12254,660.523458,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,count-dataset-tokens,660.523458,False,0.0,False,660.523458 +1737acd6-bc8f-4704-ba36-ab214e8bc851,gemini-2.5-flash,gemini,install-klee-minimal,11299,2635,13934,900.065827,False,0.0,gemini-2.5-flash,install-klee-minimal,900.065827,False,0.0,False,900.065827 +65f195a6-067f-4ba5-a867-9106500f4a41,claude-sonnet-4-20250514,anthropic,filter-js-from-html,5918,6222,12140,901.335032,False,0.0,claude-sonnet-4-20250514,filter-js-from-html,901.335032,False,0.0,False,901.335032 +71bf0f3c-ca18-454d-8ce7-106abe7e4ba9,gpt-5-nano,openai,wasm-pipeline,12806,15564,28370,910.489231,False,0.0,gpt-5-nano,wasm-pipeline,910.489231,False,0.0,False,910.489231 +af44d6e2-e890-4da5-bd1c-87b6f74aab9f,gpt-5-mini,openai,build-cython-ext,10910,4007,14917,904.489212,False,0.0,gpt-5-mini,build-cython-ext,904.489212,False,0.2,False,904.489212 
+11bccd25-6a06-4148-81fe-cfc088994109,claude-opus-4-1-20250805,anthropic,nginx-request-logging,7362,3084,10446,638.090941,True,1.0,claude-opus-4-1-20250805,nginx-request-logging,638.090941,True,1.0,True,638.090941 +da528a2d-7a4f-483b-b4ef-844a2a4da5b2,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,vulnerable-secret,2493,2798,5291,97.466118,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,vulnerable-secret,97.466118,False,0.0,False,97.466118 +a5b128fd-ae8c-4096-a1d9-652883d27b90,gpt-5-mini,openai,make-mips-interpreter,16023,29906,45929,1801.298598,False,0.0,gpt-5-mini,make-mips-interpreter,1801.298598,False,0.0,False,1801.298598 +05a8f0e7-3275-4e52-b132-059c3051163e,gemini-2.5-pro,gemini,regex-log,1468,1441,2909,219.624419,True,1.0,gemini-2.5-pro,regex-log,219.624419,True,0.8,True,219.624419 +2d475720-4f6e-4d19-b7d2-e0c6b6f45179,openai/gpt-oss-120b,together_ai,make-mips-interpreter,16881,13308,30189,1810.701113,False,0.0,openai/gpt-oss-120b,make-mips-interpreter,1810.701113,False,0.0,False,1810.701113 +664b1a7c-a3f9-44b7-b27f-53010ecd4d04,gemini-2.5-pro,gemini,configure-git-webserver,5262,1373,6635,794.839694,False,0.0,gemini-2.5-pro,configure-git-webserver,794.839694,False,0.0,False,794.839694 +5852e644-02a5-4a15-b7bc-86af6e464aa1,claude-sonnet-4-20250514,anthropic,circuit-fibsqrt,15496,15701,31197,1840.893847,False,0.0,claude-sonnet-4-20250514,circuit-fibsqrt,1840.893847,False,0.0,False,1840.893847 +77c0bb18-fe71-4d18-aa9a-c3479ad29348,OpenAI/gpt-oss-20B,together_ai,pytorch-model-recovery,2222,12669,14891,900.959363,False,0.0,OpenAI/gpt-oss-20B,pytorch-model-recovery,900.959363,False,0.0,False,900.959363 +ca89ec53-ac5b-4b58-a815-b2ef8c7acc64,gpt-5-nano,openai,log-summary-date-ranges,15409,11973,27382,569.005703,False,0.0,gpt-5-nano,log-summary-date-ranges,569.005703,False,0.0,False,569.005703 
+ac945708-daec-418a-9965-578dc75284bb,gpt-5,openai,sqlite-db-truncate,7163,5143,12306,622.8403,False,0.0,gpt-5,sqlite-db-truncate,622.8403,False,0.0,False,622.8403 +dac5886f-b7af-45b5-add6-b14513335287,grok-code-fast-1,xai,pytorch-model-cli,1398,1131,2529,41.815983,False,0.0,grok-code-fast-1,pytorch-model-cli,41.815983,False,0.0,False,41.815983 +0860c205-ef2b-4e3e-8f5d-94353bd75f3f,claude-opus-4-1-20250805,anthropic,prove-plus-comm,1630,1123,2753,42.635086,True,1.0,claude-opus-4-1-20250805,prove-plus-comm,42.635086,True,1.0,True,42.635086 +2ee9af8f-e91d-4a56-9ff8-64ca92b18ba7,openai/gpt-oss-120b,together_ai,pytorch-model-cli,1245,960,2205,225.341036,False,0.0,openai/gpt-oss-120b,pytorch-model-cli,225.341036,False,0.0,False,225.341036 +75686b99-aaee-470c-aa2b-218413f22ef6,grok-4-0709,xai,chess-best-move,10218,2775,12993,917.131429,False,0.0,grok-4-0709,chess-best-move,917.131429,False,0.0,False,917.131429 +a2e17e65-5d9b-45cc-9cbc-e9f79b1de82f,gemini-2.5-flash,gemini,largest-eigenval,6678,6162,12840,908.089323,False,0.0,gemini-2.5-flash,largest-eigenval,908.089323,False,0.0,False,908.089323 +23a1fe6f-4b26-4a39-b888-49cb5b80b99c,claude-sonnet-4-20250514,anthropic,polyglot-c-py,7253,5248,12501,209.998694,False,0.0,claude-sonnet-4-20250514,polyglot-c-py,209.998694,False,0.0,False,209.998694 +eebee320-bc48-412e-9d6a-f3a116f7a014,openai/gpt-oss-120b,together_ai,constraints-scheduling,3590,2507,6097,47.99831,True,1.0,openai/gpt-oss-120b,constraints-scheduling,47.99831,True,1.0,True,47.99831 +4fae0c4c-f3c1-48a0-8d6d-31e283f316ed,grok-4-0709,xai,password-recovery,1823,1354,3177,1549.61206,False,0.0,grok-4-0709,password-recovery,1549.61206,False,0.0,False,1549.61206 +b35f5b57-f56d-4958-8137-8cc6e3d73957,OpenAI/gpt-oss-20B,together_ai,code-from-image,273,275,548,42.88561,False,0.0,OpenAI/gpt-oss-20B,code-from-image,42.88561,False,0.0,False,42.88561 
+a85b0731-f46b-401f-b2ec-75a5b5bed178,grok-4-0709,xai,hf-model-inference,3923,1749,5672,460.246729,True,1.0,grok-4-0709,hf-model-inference,460.246729,True,1.0,True,460.246729 +289ebe1c-5513-447d-b30c-4c4ccda1d500,claude-opus-4-1-20250805,anthropic,polyglot-rust-c,11861,10888,22749,931.888686,False,0.0,claude-opus-4-1-20250805,polyglot-rust-c,931.888686,False,0.0,False,931.888686 +e359f792-5f92-4b75-b18d-ca66c5589226,claude-opus-4-1-20250805,anthropic,circuit-fibsqrt,35031,30979,66010,3600.00101,False,0.0,claude-opus-4-1-20250805,circuit-fibsqrt,3600.00101,False,0.0,False,3600.00101 +4d5a7857-dda2-44ef-933b-ebee4ddb8e43,deepseek-ai/DeepSeek-V3.1,together_ai,break-filter-js-from-html,2085,1888,3973,168.862087,False,0.0,deepseek-ai/DeepSeek-V3.1,break-filter-js-from-html,168.862087,False,0.0,False,168.862087 +7111a952-bb48-4637-bcc5-90e2b2a6e645,claude-opus-4-1-20250805,anthropic,fix-ocaml-gc,71949,44906,116855,2914.706675,True,1.0,claude-opus-4-1-20250805,fix-ocaml-gc,2914.706675,True,0.5,True,2914.706675 +57141c5b-894c-4a75-8e4f-067bda64fd7d,claude-opus-4-1-20250805,anthropic,run-pdp11-code,7091,5649,12740,507.681048,False,0.0,claude-opus-4-1-20250805,run-pdp11-code,507.681048,False,0.0,False,507.681048 +f3aaaa56-3b9c-4dbd-bfb8-68e1a418e5d4,zai-org/GLM-4.5-Air-FP8,together_ai,install-windows-3.11,7845,2808,10653,256.979049,False,0.0,zai-org/GLM-4.5-Air-FP8,install-windows-3.11,256.979049,False,0.0,False,256.979049 +5476fd2a-cbac-4616-8dad-538df3dad114,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,feal-differential-cryptanalysis,3860,2351,6211,117.847508,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,feal-differential-cryptanalysis,117.847508,False,0.0,False,117.847508 +d93d4b90-685d-4b01-881c-e2fda359eaa4,OpenAI/gpt-oss-20B,together_ai,video-processing,904,1672,2576,126.6624,False,0.0,OpenAI/gpt-oss-20B,video-processing,126.6624,False,0.0,False,126.6624 
+f2f0e62a-53d6-46e4-8079-18e35b7275b0,gpt-5-nano,openai,make-doom-for-mips,15306,4174,19480,908.780469,False,0.0,gpt-5-nano,make-doom-for-mips,908.780469,False,0.0,False,908.780469 +e3cc33a2-fdc7-4956-92ca-7ad94ee08590,grok-code-fast-1,xai,build-pmars,14970,3584,18554,330.507402,True,1.0,grok-code-fast-1,build-pmars,330.507402,True,0.8,True,330.507402 +15e6a4da-5f5f-44c7-ab4f-31495d6aeee2,zai-org/GLM-4.5-Air-FP8,together_ai,fix-code-vulnerability,11452,5863,17315,1034.219472,False,0.0,zai-org/GLM-4.5-Air-FP8,fix-code-vulnerability,1034.219472,False,0.0,False,1034.219472 +eacbe383-7502-40f8-abae-23c21dcbb715,claude-opus-4-1-20250805,anthropic,run-pdp11-code,4948,3857,8805,165.716155,False,0.0,claude-opus-4-1-20250805,run-pdp11-code,165.716155,False,0.0,False,165.716155 +2c7c7e86-cf68-4505-9e2d-5ff42416f989,gpt-5-nano,openai,chess-best-move,21023,13418,34441,901.766858,False,0.0,gpt-5-nano,chess-best-move,901.766858,False,0.0,False,901.766858 +a904a358-9444-48b2-9eba-1f11512c38e3,gpt-5-nano,openai,db-wal-recovery,6757,8513,15270,1029.392734,False,0.0,gpt-5-nano,db-wal-recovery,1029.392734,False,0.0,False,1029.392734 +863f0fa2-4254-4da1-b6b5-cf6685825362,claude-sonnet-4-20250514,anthropic,wasm-pipeline,19138,6924,26062,798.060662,False,0.0,claude-sonnet-4-20250514,wasm-pipeline,798.060662,False,0.6,False,798.060662 +815c3e02-432b-4731-bfcb-6c12f69a8b21,zai-org/GLM-4.5-Air-FP8,together_ai,crack-7z-hash,12022,8768,20790,900.763471,False,0.0,zai-org/GLM-4.5-Air-FP8,crack-7z-hash,900.763471,False,0.0,False,900.763471 +e0092756-f974-48d3-9739-47acdd80b5ea,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,adaptive-rejection-sampler,12306,7111,19417,905.828396,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,adaptive-rejection-sampler,905.828396,False,0.0,False,905.828396 +db138fc4-725e-4613-b599-6823738a4c07,grok-4-0709,xai,largest-eigenval,10045,5682,15727,902.725174,False,0.0,grok-4-0709,largest-eigenval,902.725174,False,0.0,False,902.725174 
+865a1dbd-87b9-4299-960b-266a47f8fccd,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sanitize-git-repo,15829,3600,19429,368.31449,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sanitize-git-repo,368.31449,False,0.0,False,368.31449 +b83d72b2-807e-4d72-9e83-03a2f325debc,claude-opus-4-1-20250805,anthropic,regex-log,2933,2689,5622,159.970616,True,1.0,claude-opus-4-1-20250805,regex-log,159.970616,True,0.5714285714285714,True,159.970616 +ff59fa90-6cf3-4473-a07f-9d78e7f802dc,zai-org/GLM-4.5-Air-FP8,together_ai,sqlite-db-truncate,2178,2722,4900,686.913767,False,0.0,zai-org/GLM-4.5-Air-FP8,sqlite-db-truncate,686.913767,False,0.0,False,686.913767 +aaf28db0-7afb-445d-98c7-b0b6ea17ddb1,openai/gpt-oss-120b,together_ai,make-mips-interpreter,15494,9176,24670,1802.664278,False,0.0,openai/gpt-oss-120b,make-mips-interpreter,1802.664278,False,0.0,False,1802.664278 +d78c2f30-c4d2-4eac-bf8e-2ed0a1883628,gemini-2.5-flash,gemini,form-filling,25694,45237,70931,909.09964,False,0.0,gemini-2.5-flash,form-filling,909.09964,False,0.0,False,909.09964 +374a8aba-7613-4678-834c-bd7638170198,claude-sonnet-4-20250514,anthropic,git-leak-recovery,3304,3564,6868,519.911198,True,1.0,claude-sonnet-4-20250514,git-leak-recovery,519.911198,True,1.0,True,519.911198 +183629c0-2a41-4b88-a2cb-dfd5545393f4,OpenAI/gpt-oss-20B,together_ai,qemu-alpine-ssh,2352,10045,12397,1046.027955,False,0.0,OpenAI/gpt-oss-20B,qemu-alpine-ssh,1046.027955,False,0.0,False,1046.027955 +80f3b88a-e759-4644-adf0-d694567f935a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,mteb-leaderboard,4460,2027,6487,195.191571,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,mteb-leaderboard,195.191571,False,0.0,False,195.191571 +471a30d0-ad55-4fee-bae0-ffd41c9c740e,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,video-processing,2695,1977,4672,146.085358,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,video-processing,146.085358,False,0.0,False,146.085358 
+ddca5d2e-c708-42f5-a5a9-b519c17c7fe8,zai-org/GLM-4.5-Air-FP8,together_ai,sqlite-db-truncate,5749,5694,11443,277.203435,False,0.0,zai-org/GLM-4.5-Air-FP8,sqlite-db-truncate,277.203435,False,0.0,False,277.203435 +8b0afaf3-c1cb-47f7-978d-73841854dd25,gemini-2.5-pro,gemini,video-processing,6488,6540,13028,621.493911,False,0.0,gemini-2.5-pro,video-processing,621.493911,False,0.0,False,621.493911 +9aec2289-409b-498e-b4cb-591fe49ad2ba,deepseek-ai/DeepSeek-V3.1,together_ai,bn-fit-modify,29905,21169,51074,3003.956623,False,0.0,deepseek-ai/DeepSeek-V3.1,bn-fit-modify,3003.956623,False,0.0,False,3003.956623 +85726105-f0d0-4bac-8949-7239a5c34eb2,grok-code-fast-1,xai,schemelike-metacircular-eval,3963,2599,6562,85.881396,False,0.0,grok-code-fast-1,schemelike-metacircular-eval,85.881396,False,0.0,False,85.881396 +3cd86300-4a0a-4b72-83bd-fc2d03672e15,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,code-from-image,8235,4895,13130,322.815884,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,code-from-image,322.815884,True,0.2,True,322.815884 +df555d26-9e80-4b31-836b-0513732216e5,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,schemelike-metacircular-eval,13403,8390,21793,399.608925,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,schemelike-metacircular-eval,399.608925,False,0.0,False,399.608925 +5981f001-af9c-46a4-8613-e7d2b3e83a83,gpt-5,openai,prove-plus-comm,1802,1249,3051,360.230246,False,0.0,gpt-5,prove-plus-comm,360.230246,False,0.8571428571428571,False,360.230246 +4585c41e-32e5-405b-8c54-19fc2ced7d3d,claude-opus-4-1-20250805,anthropic,adaptive-rejection-sampler,6281,3473,9754,900.001006,False,0.0,claude-opus-4-1-20250805,adaptive-rejection-sampler,900.001006,False,0.125,False,900.001006 +1df9c3c1-be10-4ba4-825d-809d1038a77e,grok-code-fast-1,xai,tune-mjcf,5752,5595,11347,548.133842,False,0.0,grok-code-fast-1,tune-mjcf,548.133842,False,0.4,False,548.133842 
+c241138e-39d6-47e4-aa0b-9cc1f7ea66db,grok-4-0709,xai,count-dataset-tokens,18064,3286,21350,874.135824,False,0.0,grok-4-0709,count-dataset-tokens,874.135824,False,0.0,False,874.135824 +95dcd984-798b-4428-aefa-c0367feaaefa,openai/gpt-oss-120b,together_ai,sparql-university,1522,770,2292,138.075652,False,0.0,openai/gpt-oss-120b,sparql-university,138.075652,False,0.0,False,138.075652 +91c244c5-c83d-4a36-b897-31b0236caa8a,moonshotai/Kimi-K2-Instruct-0905,together_ai,run-pdp11-code,3733,3061,6794,1001.317613,False,0.0,moonshotai/Kimi-K2-Instruct-0905,run-pdp11-code,1001.317613,False,0.0,False,1001.317613 +e95c6568-e2af-4706-af63-cf3299e21537,grok-code-fast-1,xai,pytorch-model-recovery,6514,3279,9793,210.826855,True,1.0,grok-code-fast-1,pytorch-model-recovery,210.826855,True,0.8,True,210.826855 +ee895e13-0c39-4d00-b6b8-9173df0f3fde,zai-org/GLM-4.5-Air-FP8,together_ai,break-filter-js-from-html,2555,3101,5656,768.959523,False,0.0,zai-org/GLM-4.5-Air-FP8,break-filter-js-from-html,768.959523,False,0.0,False,768.959523 +291d4605-6f73-42e3-b62c-245b63536a2e,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,merge-diff-arc-agi-task,6445,1763,8208,926.567994,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,merge-diff-arc-agi-task,926.567994,False,0.4,False,926.567994 +65b2f282-c1a8-4eba-ad74-8823dc4a2124,gemini-2.5-flash,gemini,schemelike-metacircular-eval,23127,16998,40125,2407.326708,False,0.0,gemini-2.5-flash,schemelike-metacircular-eval,2407.326708,False,0.2,False,2407.326708 +dfc9658d-b782-4ac2-9dbf-f521957733bb,zai-org/GLM-4.5-Air-FP8,together_ai,distribution-search,26979,26564,53543,1558.271111,False,0.0,zai-org/GLM-4.5-Air-FP8,distribution-search,1558.271111,False,0.0,False,1558.271111 +4ce53677-4b76-4d33-a901-034a0562418f,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,merge-diff-arc-agi-task,9132,3377,12509,388.994456,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,merge-diff-arc-agi-task,388.994456,True,0.4,True,388.994456 
+b6d8e351-37b1-4d5e-9141-6ad8945ad922,grok-4-0709,xai,adaptive-rejection-sampler,7417,6882,14299,900.161335,False,0.0,grok-4-0709,adaptive-rejection-sampler,900.161335,False,0.0,False,900.161335 +0b39aa41-2fd9-41a1-811f-1d4498e0c9ee,OpenAI/gpt-oss-20B,together_ai,torch-tensor-parallelism,175,173,348,110.700496,False,0.0,OpenAI/gpt-oss-20B,torch-tensor-parallelism,110.700496,False,0.0,False,110.700496 +e8ce1179-b3e5-406a-9e28-675bfe510eb0,openai/gpt-oss-120b,together_ai,cancel-async-tasks,1361,764,2125,84.453769,True,1.0,openai/gpt-oss-120b,cancel-async-tasks,84.453769,True,0.6,True,84.453769 +b8ab6e99-fd03-4610-8677-8b6d0db9e00f,gpt-5,openai,schemelike-metacircular-eval,12802,42132,54934,2400.010103,False,0.0,gpt-5,schemelike-metacircular-eval,2400.010103,False,0.0,False,2400.010103 +a9544ebb-ae24-4d40-bd06-a6a7924202c0,grok-4-0709,xai,tune-mjcf,4788,3845,8633,903.023304,False,0.0,grok-4-0709,tune-mjcf,903.023304,False,0.0,False,903.023304 +c0a1191e-b461-4446-91cd-b6eecd3c17a7,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,dna-assembly,9311,5189,14500,748.774548,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,dna-assembly,748.774548,False,0.0,False,748.774548 +a79ab506-a529-489d-b2b1-6d39587c5ef9,zai-org/GLM-4.5-Air-FP8,together_ai,prove-plus-comm,2677,3445,6122,166.383672,True,1.0,zai-org/GLM-4.5-Air-FP8,prove-plus-comm,166.383672,True,0.8,True,166.383672 +9b9e8459-3941-4868-94e5-1ae0a26950a1,zai-org/GLM-4.5-Air-FP8,together_ai,nginx-request-logging,3942,2463,6405,347.928665,True,1.0,zai-org/GLM-4.5-Air-FP8,nginx-request-logging,347.928665,True,1.0,True,347.928665 +1f358e6d-0c41-4026-b2b9-5facdf6758d5,gpt-5-mini,openai,crack-7z-hash,1239,561,1800,38.473258,False,0.0,gpt-5-mini,crack-7z-hash,38.473258,False,0.0,False,38.473258 +81b5d0ef-a117-40a7-89b2-feeb63b7af14,gpt-5-mini,openai,hf-model-inference,2361,1592,3953,172.569239,True,1.0,gpt-5-mini,hf-model-inference,172.569239,True,0.8,True,172.569239 
+89c27691-aeea-4d08-84c4-61e55d951d59,claude-opus-4-1-20250805,anthropic,vulnerable-secret,2458,1963,4421,972.908078,False,0.0,claude-opus-4-1-20250805,vulnerable-secret,972.908078,False,0.625,False,972.908078 +3fae39ad-14b7-495a-8c76-02cade4e259d,zai-org/GLM-4.5-Air-FP8,together_ai,cancel-async-tasks,947,989,1936,94.816883,False,0.0,zai-org/GLM-4.5-Air-FP8,cancel-async-tasks,94.816883,False,0.2,False,94.816883 +7a470ea9-c6a1-44c0-b8bf-1182dfa7291f,claude-sonnet-4-20250514,anthropic,prove-plus-comm,2511,2531,5042,279.200321,True,1.0,claude-sonnet-4-20250514,prove-plus-comm,279.200321,True,1.0,True,279.200321 +fedddab2-c70d-4c8e-8a2e-55e952b992fb,grok-code-fast-1,xai,dna-assembly,1153,539,1692,720.266035,False,0.0,grok-code-fast-1,dna-assembly,720.266035,False,0.0,False,720.266035 +0eea25f4-baf3-47ed-b4f4-048649ae57e7,openai/gpt-oss-120b,together_ai,qemu-alpine-ssh,1782,1964,3746,189.207552,False,0.0,openai/gpt-oss-120b,qemu-alpine-ssh,189.207552,False,0.0,False,189.207552 +5f1db1e7-b797-47b4-af5f-b544d065ca23,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,reverse-engineering,21811,13300,35111,2578.574091,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,reverse-engineering,2578.574091,False,0.0,False,2578.574091 +42979eaf-056d-47bf-b494-6908f91d1bee,OpenAI/gpt-oss-20B,together_ai,circuit-fibsqrt,833,2008,2841,81.249671,False,0.0,OpenAI/gpt-oss-20B,circuit-fibsqrt,81.249671,False,0.0,False,81.249671 +1410e098-b1a6-4180-85c0-df5f0aeb58ab,grok-4-0709,xai,pytorch-model-recovery,5394,3953,9347,912.813393,True,1.0,grok-4-0709,pytorch-model-recovery,912.813393,True,0.2,True,912.813393 +8bfbe760-e999-4237-b08f-db20f82a984d,gpt-5,openai,chess-best-move,19088,5403,24491,794.407654,False,0.0,gpt-5,chess-best-move,794.407654,False,0.0,False,794.407654 +fa8a7c63-a42f-4903-95f3-8b0c4dd7755a,gemini-2.5-flash,gemini,write-compressor,6316,13558,19874,907.29728,False,0.0,gemini-2.5-flash,write-compressor,907.29728,False,0.0,False,907.29728 
+9f3a78ae-9fdb-4762-98b4-774eeeaa2cf7,grok-4-0709,xai,winning-avg-corewars,7215,12194,19409,3604.435153,False,0.0,grok-4-0709,winning-avg-corewars,3604.435153,False,0.0,False,3604.435153 +8ac69219-6e09-4cad-922d-d0a024299271,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,distribution-search,8550,10137,18687,685.730188,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,distribution-search,685.730188,True,0.4,True,685.730188 +76e202bc-cf52-4ece-9ced-ae342005c907,grok-4-0709,xai,schemelike-metacircular-eval,7395,3425,10820,2418.080746,False,0.0,grok-4-0709,schemelike-metacircular-eval,2418.080746,False,0.0,False,2418.080746 +544404d7-6db5-436d-8bf8-8e55f26cf8e4,claude-opus-4-1-20250805,anthropic,mteb-leaderboard,4001,2448,6449,309.443283,False,0.0,claude-opus-4-1-20250805,mteb-leaderboard,309.443283,False,0.0,False,309.443283 +e77fe3c6-debb-4364-a6c1-1b2ba7e3183b,gpt-5-mini,openai,mteb-leaderboard,30261,24463,54724,3630.417158,False,0.0,gpt-5-mini,mteb-leaderboard,3630.417158,False,0.0,False,3630.417158 +bef2dad9-a5a6-462e-a0cc-7fc252b2d3cf,moonshotai/Kimi-K2-Instruct-0905,together_ai,sanitize-git-repo,15347,3705,19052,705.372478,False,0.0,moonshotai/Kimi-K2-Instruct-0905,sanitize-git-repo,705.372478,False,0.0,False,705.372478 +3c3e2a01-8ab5-44ae-87ca-4ddf8e440247,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,form-filling,15524,8724,24248,322.849715,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,form-filling,322.849715,False,0.0,False,322.849715 +0788ec95-dbb4-476c-8844-ddaa10bbeede,OpenAI/gpt-oss-20B,together_ai,password-recovery,159,566,725,95.814047,False,0.0,OpenAI/gpt-oss-20B,password-recovery,95.814047,False,0.0,False,95.814047 +762cf99c-0f31-4a46-b12e-9d77cbab715b,gemini-2.5-flash,gemini,run-pdp11-code,10809,2936,13745,346.061229,False,0.0,gemini-2.5-flash,run-pdp11-code,346.061229,False,0.0,False,346.061229 
+fe619032-d2c6-46a8-874e-469faedd2136,claude-sonnet-4-20250514,anthropic,git-leak-recovery,2918,2011,4929,307.443792,True,1.0,claude-sonnet-4-20250514,git-leak-recovery,307.443792,True,1.0,True,307.443792 +e3b87aaa-7450-4898-9284-cc3736de5902,gpt-5,openai,path-tracing,15729,11170,26899,1752.015862,False,0.0,gpt-5,path-tracing,1752.015862,False,0.0,False,1752.015862 +49a0f346-d0fe-4181-9206-7555273b326d,claude-opus-4-1-20250805,anthropic,install-klee-minimal,18714,2295,21009,900.000637,False,0.0,claude-opus-4-1-20250805,install-klee-minimal,900.000637,False,0.0,False,900.000637 +60ee6912-7542-4d9b-b1e8-d290c6cfbb1b,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,largest-eigenval,7940,6741,14681,611.290803,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,largest-eigenval,611.290803,True,0.2,True,611.290803 +b14d6774-d891-4203-a46d-71b1444df992,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,hf-model-inference,3218,1761,4979,122.927531,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,hf-model-inference,122.927531,True,0.8,True,122.927531 +df6e5ff7-6b56-4ecf-8e7c-f9fd7f5b4dea,moonshotai/Kimi-K2-Instruct-0905,together_ai,prove-plus-comm,1919,1334,3253,152.285369,True,1.0,moonshotai/Kimi-K2-Instruct-0905,prove-plus-comm,152.285369,True,0.8,True,152.285369 +83b972dd-44b6-44aa-ae23-4295aa5f1ac2,OpenAI/gpt-oss-20B,together_ai,reverse-engineering,723,1206,1929,457.261349,False,0.0,OpenAI/gpt-oss-20B,reverse-engineering,457.261349,False,0.0,False,457.261349 +b5323013-0018-4c91-95af-42a8586c897e,claude-sonnet-4-20250514,anthropic,constraints-scheduling,6360,3240,9600,441.858093,True,1.0,claude-sonnet-4-20250514,constraints-scheduling,441.858093,True,1.0,True,441.858093 +2c5458da-d174-40c0-87c2-1653a701e994,deepseek-ai/DeepSeek-V3.1,together_ai,reverse-engineering,9715,11838,21553,1808.092655,False,0.0,deepseek-ai/DeepSeek-V3.1,reverse-engineering,1808.092655,False,0.2,False,1808.092655 
+6c7cf140-63dd-4bc5-b608-fbb0e4fff0fc,openai/gpt-oss-120b,together_ai,path-tracing-reverse,6720,14766,21486,1800.814695,False,0.0,openai/gpt-oss-120b,path-tracing-reverse,1800.814695,False,0.0,False,1800.814695 +95cced3d-837a-4195-aca9-a18ea1133954,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,vulnerable-secret,12938,9244,22182,900.17298,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,vulnerable-secret,900.17298,False,0.4,False,900.17298 +10e4783d-31c5-4116-a557-a8fe6686f4e7,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,regex-log,1182,697,1879,85.422594,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,regex-log,85.422594,False,0.0,False,85.422594 +e61b7d43-d9de-483d-9ab5-7234d8248388,grok-code-fast-1,xai,adaptive-rejection-sampler,8883,4223,13106,236.884964,False,0.0,grok-code-fast-1,adaptive-rejection-sampler,236.884964,False,0.0,False,236.884964 +0f3bb954-0af3-4922-9dc1-be22bedeb80f,grok-code-fast-1,xai,polyglot-c-py,0,0,0,902.576206,False,0.0,grok-code-fast-1,polyglot-c-py,902.576206,False,0.0,False,902.576206 +3ac442dd-ac18-4e95-9193-ff66942a9ddd,moonshotai/Kimi-K2-Instruct-0905,together_ai,polyglot-rust-c,9820,11713,21533,903.750118,False,0.0,moonshotai/Kimi-K2-Instruct-0905,polyglot-rust-c,903.750118,False,0.0,False,903.750118 +4cd8953f-32d0-4fd7-9d10-702963de9804,claude-opus-4-1-20250805,anthropic,break-filter-js-from-html,10952,9368,20320,1210.427035,False,0.0,claude-opus-4-1-20250805,break-filter-js-from-html,1210.427035,False,0.2222222222222222,False,1210.427035 +161963d5-cb87-4201-b53c-d2f404212cf6,gpt-5-nano,openai,port-compressor,23073,22284,45357,3618.307337,False,0.0,gpt-5-nano,port-compressor,3618.307337,False,0.0,False,3618.307337 +8cf391f8-1562-4c0b-9ff3-740f02aff742,gpt-5,openai,count-dataset-tokens,9954,6322,16276,915.590993,False,0.0,gpt-5,count-dataset-tokens,915.590993,False,0.1666666666666666,False,915.590993 
+f48e2d60-d9d0-404d-b7f0-3052388fac36,grok-code-fast-1,xai,sanitize-git-repo,7829,3594,11423,728.772342,False,0.0,grok-code-fast-1,sanitize-git-repo,728.772342,False,0.0,False,728.772342 +13cc6e17-e2a7-40b2-83bd-08d1bef6960c,gemini-2.5-pro,gemini,largest-eigenval,5681,2487,8168,904.484564,False,0.0,gemini-2.5-pro,largest-eigenval,904.484564,False,0.0,False,904.484564 +c6954ee1-ecc1-4470-9021-de12d1b58e50,moonshotai/Kimi-K2-Instruct-0905,together_ai,tune-mjcf,7050,5604,12654,657.776508,True,1.0,moonshotai/Kimi-K2-Instruct-0905,tune-mjcf,657.776508,True,0.4,True,657.776508 +e85c93ef-5a1e-49f9-82de-fb84a96a5aa2,grok-4-0709,xai,train-fasttext,22162,5879,28041,2002.210252,True,1.0,grok-4-0709,train-fasttext,2002.210252,True,0.2,True,2002.210252 +60f187bc-4a5c-4215-863f-8d6be168cf4f,claude-opus-4-1-20250805,anthropic,count-dataset-tokens,11633,2947,14580,917.745426,False,0.0,claude-opus-4-1-20250805,count-dataset-tokens,917.745426,False,0.0,False,917.745426 +549550bd-347f-4b15-94c5-a923e2fba9ca,openai/gpt-oss-120b,together_ai,qemu-alpine-ssh,3488,5477,8965,907.166709,False,0.0,openai/gpt-oss-120b,qemu-alpine-ssh,907.166709,False,0.0,False,907.166709 +b0ed129d-4062-4e12-b953-32c327456a9d,grok-4-0709,xai,pypi-server,4214,757,4971,271.967675,False,0.0,grok-4-0709,pypi-server,271.967675,False,0.4,False,271.967675 +64fc6129-ff1c-4c91-92d7-f69de3791968,openai/gpt-oss-120b,together_ai,path-tracing-reverse,25416,22787,48203,1333.044395,False,0.0,openai/gpt-oss-120b,path-tracing-reverse,1333.044395,False,0.0,False,1333.044395 +9ae33fa8-67e9-453a-af59-1457992f1cac,OpenAI/gpt-oss-20B,together_ai,constraints-scheduling,1955,2106,4061,195.872986,True,1.0,OpenAI/gpt-oss-20B,constraints-scheduling,195.872986,True,0.2,True,195.872986 +34855aac-e62a-4db5-aec5-c1d9f4ae13d4,gemini-2.5-flash,gemini,hf-model-inference,6195,1949,8144,342.702249,True,1.0,gemini-2.5-flash,hf-model-inference,342.702249,True,0.6,True,342.702249 
+7e889790-c074-471d-b3cf-a1c28e3e95bf,deepseek-ai/DeepSeek-V3.1,together_ai,install-windows-3.11,7880,2692,10572,629.727973,False,0.0,deepseek-ai/DeepSeek-V3.1,install-windows-3.11,629.727973,False,0.0,False,629.727973 +7689d110-ab4a-4164-b225-86b4fc18c7e0,moonshotai/Kimi-K2-Instruct-0905,together_ai,port-compressor,61007,35480,96487,3587.103511,False,0.0,moonshotai/Kimi-K2-Instruct-0905,port-compressor,3587.103511,False,0.0,False,3587.103511 +19d78783-7ac0-43f9-8e60-146d6c189d7e,gpt-5,openai,model-extraction-relu-logits,5623,3956,9579,495.980032,False,0.0,gpt-5,model-extraction-relu-logits,495.980032,False,0.1666666666666666,False,495.980032 +8f970467-15d1-460e-83ba-852e8e198f69,openai/gpt-oss-120b,together_ai,merge-diff-arc-agi-task,7646,4917,12563,457.203985,False,0.0,openai/gpt-oss-120b,merge-diff-arc-agi-task,457.203985,False,0.0,False,457.203985 +2962dabc-034a-46bd-bf05-ff32266dae34,gpt-5-nano,openai,polyglot-rust-c,4252,4162,8414,566.271415,False,0.0,gpt-5-nano,polyglot-rust-c,566.271415,False,0.0,False,566.271415 +15a108ca-8a0f-4768-925a-797299944f3a,gpt-5,openai,pypi-server,3232,1670,4902,358.672772,False,0.0,gpt-5,pypi-server,358.672772,False,0.3333333333333333,False,358.672772 +de00bde2-f409-45d1-88d7-a6c4673035ff,moonshotai/Kimi-K2-Instruct-0905,together_ai,adaptive-rejection-sampler,16156,10905,27061,912.518545,False,0.0,moonshotai/Kimi-K2-Instruct-0905,adaptive-rejection-sampler,912.518545,False,0.0,False,912.518545 +9cb8a272-20ef-4fd3-bb45-473903962437,claude-sonnet-4-20250514,anthropic,openssl-selfsigned-cert,4213,2993,7206,249.032878,True,1.0,claude-sonnet-4-20250514,openssl-selfsigned-cert,249.032878,True,0.8,True,249.032878 +faad540d-dbfb-45a3-9ffb-9caa3a099580,openai/gpt-oss-120b,together_ai,run-pdp11-code,8111,5038,13149,291.149648,False,0.0,openai/gpt-oss-120b,run-pdp11-code,291.149648,False,0.0,False,291.149648 
+ffefb40e-0cac-40e7-8326-2664eb02b251,claude-opus-4-1-20250805,anthropic,sanitize-git-repo,8891,3708,12599,185.532736,False,0.0,claude-opus-4-1-20250805,sanitize-git-repo,185.532736,False,0.0,False,185.532736 +c1e43537-c001-4206-8bb9-50256a6101df,OpenAI/gpt-oss-20B,together_ai,nginx-request-logging,1216,1335,2551,126.724406,False,0.0,OpenAI/gpt-oss-20B,nginx-request-logging,126.724406,False,0.0,False,126.724406 +98b58079-0597-4906-96e4-0cb22dc47b83,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,filter-js-from-html,6287,6172,12459,761.075136,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,filter-js-from-html,761.075136,False,0.0,False,761.075136 +0d6b6088-f877-4903-8e6b-f4f206e33b0e,gpt-5-nano,openai,chess-best-move,9511,6954,16465,534.169005,False,0.0,gpt-5-nano,chess-best-move,534.169005,False,0.0,False,534.169005 +dade16f4-a78d-4021-9b5a-bd4783cddf91,zai-org/GLM-4.5-Air-FP8,together_ai,git-leak-recovery,4155,4164,8319,343.562996,False,0.0,zai-org/GLM-4.5-Air-FP8,git-leak-recovery,343.562996,False,0.8,False,343.562996 +c5404025-c58d-40ba-a1d2-074dd8cec48e,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,qemu-startup,3095,3361,6456,423.513362,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,qemu-startup,423.513362,False,0.0,False,423.513362 +7720dd5c-786d-446a-a3e7-c68b68d46b98,gemini-2.5-flash,gemini,password-recovery,12095,8054,20149,904.2988,False,0.0,gemini-2.5-flash,password-recovery,904.2988,False,0.0,False,904.2988 +4ca825b3-c639-4fe1-afe9-6d2989d64e9e,gpt-5-nano,openai,configure-git-webserver,7729,5570,13299,904.343931,True,1.0,gpt-5-nano,configure-git-webserver,904.343931,True,0.2,True,904.343931 +8d88385a-b419-4c98-a348-f99dccf825cf,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,code-from-image,2610,2436,5046,173.363513,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,code-from-image,173.363513,False,0.4,False,173.363513 
+e455b5b4-27c3-454a-8206-c014fe952981,grok-code-fast-1,xai,openssl-selfsigned-cert,1668,874,2542,31.139507,False,0.0,grok-code-fast-1,openssl-selfsigned-cert,31.139507,False,0.2,False,31.139507 +46a7e4ae-b4d5-4053-bea5-842dec05f212,claude-opus-4-1-20250805,anthropic,bn-fit-modify,16490,6132,22622,3148.396303,True,1.0,claude-opus-4-1-20250805,bn-fit-modify,3148.396303,True,0.875,True,3148.396303 +cb437aa1-6441-4e43-bc41-145d50d03f97,gemini-2.5-pro,gemini,mteb-retrieve,1847,799,2646,265.08156,False,0.0,gemini-2.5-pro,mteb-retrieve,265.08156,False,0.0,False,265.08156 +bcbd87dd-589f-46bd-a450-30995fb92c16,grok-code-fast-1,xai,train-fasttext,18990,6748,25738,1730.768589,False,0.0,grok-code-fast-1,train-fasttext,1730.768589,False,0.0,False,1730.768589 +bab6229c-b11f-4c20-8b67-c20987478ac4,grok-code-fast-1,xai,break-filter-js-from-html,2991,2404,5395,476.606194,False,0.0,grok-code-fast-1,break-filter-js-from-html,476.606194,False,0.0,False,476.606194 +3eec3656-5c4c-47e3-9fe3-06c9173dde87,gpt-5-nano,openai,feal-linear-cryptanalysis,8880,11915,20795,1801.069087,False,0.0,gpt-5-nano,feal-linear-cryptanalysis,1801.069087,False,0.0,False,1801.069087 +128e17b3-ec1f-4a61-836f-488b1390eec0,zai-org/GLM-4.5-Air-FP8,together_ai,sparql-university,8179,5198,13377,265.402405,False,0.0,zai-org/GLM-4.5-Air-FP8,sparql-university,265.402405,False,0.0,False,265.402405 +7ec5016b-f239-40e8-9d01-f49574de6133,OpenAI/gpt-oss-20B,together_ai,dna-assembly,2640,16529,19169,738.708681,False,0.0,OpenAI/gpt-oss-20B,dna-assembly,738.708681,False,0.0,False,738.708681 +f64e8006-7154-4174-a5b1-e8a638325b27,gpt-5-mini,openai,qemu-startup,2736,2069,4805,489.802463,True,1.0,gpt-5-mini,qemu-startup,489.802463,True,0.8,True,489.802463 +845efb28-c26a-40e9-9ee5-1c658d898fa4,zai-org/GLM-4.5-Air-FP8,together_ai,regex-log,2070,1903,3973,392.381113,True,1.0,zai-org/GLM-4.5-Air-FP8,regex-log,392.381113,True,0.2,True,392.381113 
+e6e4c2ca-a0b8-4091-9195-f9446a5be443,gemini-2.5-pro,gemini,path-tracing-reverse,19227,16249,35476,1844.497132,False,0.0,gemini-2.5-pro,path-tracing-reverse,1844.497132,False,0.0,False,1844.497132 +eadc8fa7-6d3a-4c79-8a75-f653350965df,zai-org/GLM-4.5-Air-FP8,together_ai,torch-tensor-parallelism,2051,1800,3851,14.284388,False,0.0,zai-org/GLM-4.5-Air-FP8,torch-tensor-parallelism,14.284388,False,0.0,False,14.284388 +5288c6f2-556a-4003-95e7-60791d392cde,openai/gpt-oss-120b,together_ai,run-pdp11-code,6688,5131,11819,234.588641,False,0.0,openai/gpt-oss-120b,run-pdp11-code,234.588641,False,0.0,False,234.588641 +2b66e04a-d5f0-478a-bdbc-31fabcb68731,claude-sonnet-4-20250514,anthropic,filter-js-from-html,6396,6277,12673,490.116923,False,0.0,claude-sonnet-4-20250514,filter-js-from-html,490.116923,False,0.0,False,490.116923 +d3fcc935-7551-4958-a2c7-a5126341affb,zai-org/GLM-4.5-Air-FP8,together_ai,configure-git-webserver,6646,2624,9270,926.116323,False,0.0,zai-org/GLM-4.5-Air-FP8,configure-git-webserver,926.116323,False,0.0,False,926.116323 +2049d7fa-ee61-482a-815c-b65da781924b,gpt-5-mini,openai,video-processing,5950,5511,11461,217.833027,False,0.0,gpt-5-mini,video-processing,217.833027,False,0.0,False,217.833027 +2e71fcaf-1f3f-437b-816d-23f5499b06e5,gemini-2.5-flash,gemini,sparql-university,5129,2782,7911,161.246405,False,0.0,gemini-2.5-flash,sparql-university,161.246405,False,0.0,False,161.246405 +e467dd30-9015-4936-98a1-34023bc288b5,openai/gpt-oss-120b,together_ai,cancel-async-tasks,1245,648,1893,61.728873,True,1.0,openai/gpt-oss-120b,cancel-async-tasks,61.728873,True,0.6,True,61.728873 +80653225-189c-49c3-9a80-239fa55a962a,moonshotai/Kimi-K2-Instruct-0905,together_ai,install-windows-3.11,11098,5444,16542,350.44511,False,0.0,moonshotai/Kimi-K2-Instruct-0905,install-windows-3.11,350.44511,False,0.0,False,350.44511 
+cc48fed2-91d7-4c3f-8eda-ed44ed0966c5,deepseek-ai/DeepSeek-V3.1,together_ai,build-cython-ext,19280,6922,26202,476.681314,False,0.0,deepseek-ai/DeepSeek-V3.1,build-cython-ext,476.681314,False,0.0,False,476.681314 +85fe6953-69d1-4aee-b6d9-00cb15afc512,zai-org/GLM-4.5-Air-FP8,together_ai,port-compressor,47310,46255,93565,969.220147,False,0.0,zai-org/GLM-4.5-Air-FP8,port-compressor,969.220147,False,0.0,False,969.220147 +3be5bc00-4b96-4d4b-a7c2-b35028544c7b,gemini-2.5-pro,gemini,path-tracing,2317,2000,4317,286.591562,False,0.0,gemini-2.5-pro,path-tracing,286.591562,False,0.0,False,286.591562 +edca92f3-d1d0-4226-ae43-4a3982e6e439,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,log-summary-date-ranges,10233,3893,14126,290.677938,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,log-summary-date-ranges,290.677938,True,0.8,True,290.677938 +e3432469-bc98-4649-955f-c43d27d5eec5,grok-4-0709,xai,video-processing,1861,1091,2952,185.652558,False,0.0,grok-4-0709,video-processing,185.652558,False,0.0,False,185.652558 +ab4aeaa7-e721-4f7b-bbc2-23f1c82a79de,gemini-2.5-flash,gemini,distribution-search,17244,19178,36422,2288.844989,False,0.0,gemini-2.5-flash,distribution-search,2288.844989,False,0.0,False,2288.844989 +d6a7e673-c414-46a1-b2bd-65f3bdeb5a25,moonshotai/Kimi-K2-Instruct-0905,together_ai,wasm-pipeline,6688,7573,14261,829.864205,True,1.0,moonshotai/Kimi-K2-Instruct-0905,wasm-pipeline,829.864205,True,0.2,True,829.864205 +549774d0-43cc-4e20-81f3-d865a384156d,claude-sonnet-4-20250514,anthropic,dna-insert,5850,1456,7306,360.637374,False,0.0,claude-sonnet-4-20250514,dna-insert,360.637374,False,0.0,False,360.637374 +905cb864-7a06-47d4-a7cc-bfa647e1d097,claude-opus-4-1-20250805,anthropic,fix-ocaml-gc,29941,30317,60258,3604.894393,False,0.0,claude-opus-4-1-20250805,fix-ocaml-gc,3604.894393,False,0.5,False,3604.894393 
+f61fa8a5-ab5a-41ed-a457-ca9dcc147cb5,OpenAI/gpt-oss-20B,together_ai,sparql-university,552,778,1330,136.629269,False,0.0,OpenAI/gpt-oss-20B,sparql-university,136.629269,False,0.0,False,136.629269 +9175c86e-8e5a-43f4-90e2-802bbae7f0a5,gemini-2.5-pro,gemini,git-leak-recovery,2127,1328,3455,179.399228,True,1.0,gemini-2.5-pro,git-leak-recovery,179.399228,True,1.0,True,179.399228 +c72da553-cf68-482d-aa1b-28d792bfb6cc,gpt-5,openai,reshard-c4-data,4664,7230,11894,900.050693,False,0.0,gpt-5,reshard-c4-data,900.050693,False,0.3333333333333333,False,900.050693 +390ea97a-778b-41ea-bb44-c524dc8df9d7,gpt-5-nano,openai,reverse-engineering,26042,11381,37423,1801.412052,False,0.0,gpt-5-nano,reverse-engineering,1801.412052,False,0.0,False,1801.412052 +4203ab45-55b1-4d42-a5c8-a1cae86b628f,gemini-2.5-flash,gemini,code-from-image,6341,4355,10696,355.965274,True,1.0,gemini-2.5-flash,code-from-image,355.965274,True,0.4,True,355.965274 +dba1d7ec-2b63-4c1c-8a97-582055238660,claude-sonnet-4-20250514,anthropic,hf-model-inference,6816,4555,11371,326.045056,False,0.0,claude-sonnet-4-20250514,hf-model-inference,326.045056,False,0.2,False,326.045056 +4c5acd84-198a-48f1-95cd-255cfb2b8101,zai-org/GLM-4.5-Air-FP8,together_ai,nginx-request-logging,7828,5219,13047,530.223748,True,1.0,zai-org/GLM-4.5-Air-FP8,nginx-request-logging,530.223748,True,1.0,True,530.223748 +881a261a-9ddc-4050-acbd-de862f6c5851,moonshotai/Kimi-K2-Instruct-0905,together_ai,fix-git,4765,3609,8374,328.626363,True,1.0,moonshotai/Kimi-K2-Instruct-0905,fix-git,328.626363,True,1.0,True,328.626363 +6ade59a9-97ae-41e5-ab64-d68f42099dbc,gpt-5,openai,vulnerable-secret,9401,7052,16453,900.001249,False,0.0,gpt-5,vulnerable-secret,900.001249,False,0.2857142857142857,False,900.001249 +6ff97d3e-14fe-4934-8945-cc795cf037e3,gpt-5-mini,openai,vulnerable-secret,7777,2944,10721,911.579853,False,0.0,gpt-5-mini,vulnerable-secret,911.579853,False,0.4,False,911.579853 
+416ac3f4-67b2-4ee6-b8e2-a7803e3f3d8f,gemini-2.5-flash,gemini,sqlite-db-truncate,4096,5364,9460,924.676223,False,0.0,gemini-2.5-flash,sqlite-db-truncate,924.676223,False,0.0,False,924.676223 +f168d391-0770-427c-8bec-b272105f2439,deepseek-ai/DeepSeek-V3.1,together_ai,count-dataset-tokens,15410,4234,19644,616.656743,False,0.0,deepseek-ai/DeepSeek-V3.1,count-dataset-tokens,616.656743,False,0.0,False,616.656743 +1bf5a051-bb8f-43fd-a21d-0a9144ada50a,grok-4-0709,xai,prove-plus-comm,1732,1996,3728,904.255835,False,0.0,grok-4-0709,prove-plus-comm,904.255835,False,0.8,False,904.255835 +4c40dec6-6d4b-4fd5-8552-e0ee6ad2768b,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,largest-eigenval,3968,3038,7006,913.220029,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,largest-eigenval,913.220029,False,0.0,False,913.220029 +eb3ee69a-a2c9-4619-a2db-a0d92cc6c8a0,gemini-2.5-pro,gemini,fix-code-vulnerability,10778,5997,16775,900.008762,False,0.0,gemini-2.5-pro,fix-code-vulnerability,900.008762,False,0.2,False,900.008762 +5f36c3b8-8bb8-44bf-b68e-8f19fa96c1dc,openai/gpt-oss-120b,together_ai,largest-eigenval,9818,9329,19147,921.148706,False,0.0,openai/gpt-oss-120b,largest-eigenval,921.148706,False,0.0,False,921.148706 +7a6e8762-3089-43db-916a-80eeb0ad1e75,claude-opus-4-1-20250805,anthropic,hf-model-inference,5102,3452,8554,171.021963,True,1.0,claude-opus-4-1-20250805,hf-model-inference,171.021963,True,0.25,True,171.021963 +961df3ac-84a2-42a7-8a33-d7ae773af3a1,deepseek-ai/DeepSeek-V3.1,together_ai,dna-assembly,10787,6654,17441,95.402357,False,0.0,deepseek-ai/DeepSeek-V3.1,dna-assembly,95.402357,False,0.0,False,95.402357 +40cb4c1f-9bf1-40a5-bd54-c385e8b283a0,gemini-2.5-flash,gemini,wasm-pipeline,7672,6174,13846,682.407067,True,1.0,gemini-2.5-flash,wasm-pipeline,682.407067,True,0.4,True,682.407067 
+6445caef-5deb-4dee-89b3-d502ddbe7e71,claude-opus-4-1-20250805,anthropic,fix-git,3387,1993,5380,173.755913,True,1.0,claude-opus-4-1-20250805,fix-git,173.755913,True,1.0,True,173.755913 +a1828aca-94e3-4360-ab4f-fa4197ce1938,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,make-mips-interpreter,23532,20222,43754,1807.904752,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,make-mips-interpreter,1807.904752,False,0.0,False,1807.904752 +32752537-4bb3-485b-acd0-f7f04d7b476f,gemini-2.5-flash,gemini,feal-differential-cryptanalysis,18641,53105,71746,1803.341612,False,0.0,gemini-2.5-flash,feal-differential-cryptanalysis,1803.341612,False,0.2,False,1803.341612 +d56f6a1b-b9c1-49a2-9dea-38e180430db7,OpenAI/gpt-oss-20B,together_ai,form-filling,6003,18299,24302,906.36875,False,0.0,OpenAI/gpt-oss-20B,form-filling,906.36875,False,0.0,False,906.36875 +eb7fbc0a-f5bd-46e8-9a16-47ba53568a8a,grok-4-0709,xai,configure-git-webserver,4554,1038,5592,537.516035,False,0.0,grok-4-0709,configure-git-webserver,537.516035,False,0.0,False,537.516035 +1fdd1600-720e-4a94-a715-c36ec8007b84,OpenAI/gpt-oss-20B,together_ai,run-pdp11-code,1345,2894,4239,279.488057,False,0.0,OpenAI/gpt-oss-20B,run-pdp11-code,279.488057,False,0.0,False,279.488057 +8d06c0ad-9258-48c7-b0cb-ff4932f77fd9,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,feal-differential-cryptanalysis,8644,8613,17257,540.398693,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,feal-differential-cryptanalysis,540.398693,False,0.0,False,540.398693 +0ab2a2c3-3e70-4e61-b6bc-6a371f18180c,claude-sonnet-4-20250514,anthropic,winning-avg-corewars,19691,19087,38778,1962.447596,False,0.0,claude-sonnet-4-20250514,winning-avg-corewars,1962.447596,False,0.0,False,1962.447596 +fa5d53e1-5fee-4256-bac0-d7ffbc7100b8,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-pov-ray,18577,8331,26908,1080.864159,True,1.0,moonshotai/Kimi-K2-Instruct-0905,build-pov-ray,1080.864159,True,1.0,True,1080.864159 
+ca928ae5-9635-4af4-907e-c3cdc9f0e2f4,gpt-5-nano,openai,path-tracing-reverse,2722,2309,5031,277.176631,False,0.0,gpt-5-nano,path-tracing-reverse,277.176631,False,0.0,False,277.176631 +59851ada-2785-4dd3-9a66-b68ee935e8ce,gpt-5-nano,openai,filter-js-from-html,1364,1047,2411,176.890287,False,0.0,gpt-5-nano,filter-js-from-html,176.890287,False,0.0,False,176.890287 +d9be2078-30c2-4de2-a095-53d2c0ed7253,deepseek-ai/DeepSeek-V3.1,together_ai,form-filling,6335,3737,10072,2067.753321,False,0.0,deepseek-ai/DeepSeek-V3.1,form-filling,2067.753321,False,0.8,False,2067.753321 +56f9b237-5bc6-43eb-86c5-9ed3dc3003ec,gpt-5-nano,openai,constraints-scheduling,8174,7640,15814,395.72651,False,0.0,gpt-5-nano,constraints-scheduling,395.72651,False,0.4,False,395.72651 +bc525386-45b2-4772-902c-65513e8adb60,grok-4-0709,xai,video-processing,1579,1641,3220,239.463111,False,0.0,grok-4-0709,video-processing,239.463111,False,0.0,False,239.463111 +83552a4c-811c-4cef-b811-775616315075,gpt-5-nano,openai,train-fasttext,9325,7302,16627,3600.000437,False,0.0,gpt-5-nano,train-fasttext,3600.000437,False,0.0,False,3600.000437 +4ada5ba2-e124-4f16-b1d7-f3196cfd1fff,OpenAI/gpt-oss-20B,together_ai,circuit-fibsqrt,271,1406,1677,78.605927,False,0.0,OpenAI/gpt-oss-20B,circuit-fibsqrt,78.605927,False,0.0,False,78.605927 +2801141f-7806-407c-8253-5288388fda09,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,path-tracing,5029,6144,11173,1119.455138,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,path-tracing,1119.455138,False,0.0,False,1119.455138 +7c1417e5-2e14-406e-8c63-dfa2066aeb6b,gpt-5-nano,openai,cancel-async-tasks,1308,1142,2450,100.905734,True,1.0,gpt-5-nano,cancel-async-tasks,100.905734,True,0.4,True,100.905734 +e212ca2d-37e8-4daa-a982-a7d2bd470bad,deepseek-ai/DeepSeek-V3.1,together_ai,crack-7z-hash,10254,5269,15523,730.519052,True,1.0,deepseek-ai/DeepSeek-V3.1,crack-7z-hash,730.519052,True,0.8,True,730.519052 
+4d772dfc-a25e-4c74-9ee6-adb56a3a5d5d,grok-code-fast-1,xai,chess-best-move,6969,4882,11851,747.076536,False,0.0,grok-code-fast-1,chess-best-move,747.076536,False,0.0,False,747.076536 +3531b50a-5316-4e50-859c-1a99575eb5fb,gemini-2.5-flash,gemini,qemu-startup,1132,1068,2200,122.717458,False,0.0,gemini-2.5-flash,qemu-startup,122.717458,False,0.2,False,122.717458 +1316c1bc-bc3e-431f-b5a6-de43f86d1331,gpt-5,openai,reshard-c4-data,3263,5518,8781,626.964926,False,0.0,gpt-5,reshard-c4-data,626.964926,False,0.3333333333333333,False,626.964926 +e4ba06d7-4687-4dcb-b03f-e6b8ee40946c,grok-4-0709,xai,prove-plus-comm,2544,1353,3897,339.93954,True,1.0,grok-4-0709,prove-plus-comm,339.93954,True,0.8,True,339.93954 +33ead04b-d8d3-4b54-b232-4bc9421e7a8f,gpt-5-mini,openai,build-cython-ext,9997,4676,14673,901.121688,True,1.0,gpt-5-mini,build-cython-ext,901.121688,True,0.2,True,901.121688 +a38a3cae-6291-4236-9e2d-3d4383388866,gemini-2.5-flash,gemini,schemelike-metacircular-eval,17059,31766,48825,2401.401767,False,0.0,gemini-2.5-flash,schemelike-metacircular-eval,2401.401767,False,0.2,False,2401.401767 +6271509b-0b07-4d76-a653-3cc1c187a6d9,gpt-5-mini,openai,model-extraction-relu-logits,4519,3795,8314,327.181601,False,0.0,gpt-5-mini,model-extraction-relu-logits,327.181601,False,0.0,False,327.181601 +b961da7e-a721-4c05-b52b-75e8b035f040,claude-opus-4-1-20250805,anthropic,distribution-search,21831,16213,38044,987.774852,True,1.0,claude-opus-4-1-20250805,distribution-search,987.774852,True,0.5555555555555556,True,987.774852 +3b6ae06e-0b7c-47fa-81d2-7b082207e94b,claude-sonnet-4-20250514,anthropic,winning-avg-corewars,21287,21228,42515,3817.485632,False,0.0,claude-sonnet-4-20250514,winning-avg-corewars,3817.485632,False,0.0,False,3817.485632 +449e75d6-874d-4db1-986f-1ef70401564b,claude-opus-4-1-20250805,anthropic,fix-git,3644,1940,5584,94.675205,True,1.0,claude-opus-4-1-20250805,fix-git,94.675205,True,1.0,True,94.675205 
+a72ef5f7-7d68-4082-a673-434f60ae3107,gpt-5-nano,openai,constraints-scheduling,3505,2709,6214,227.173906,True,1.0,gpt-5-nano,constraints-scheduling,227.173906,True,0.4,True,227.173906 +5ab76039-41b8-4155-b348-f32ff5c8cce2,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,cobol-modernization,6394,4489,10883,901.554932,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,cobol-modernization,901.554932,True,0.4,True,901.554932 +07a36267-0f21-4f98-88db-732144ddff0f,openai/gpt-oss-120b,together_ai,make-doom-for-mips,2084,425,2509,966.58628,False,0.0,openai/gpt-oss-120b,make-doom-for-mips,966.58628,False,0.0,False,966.58628 +cf0ad0f1-34fe-4b91-9ff7-b224629be63c,gpt-5-nano,openai,qemu-startup,4203,5589,9792,900.477429,False,0.0,gpt-5-nano,qemu-startup,900.477429,False,0.0,False,900.477429 +3d46f0d9-7f95-42c8-8daa-6a115909702e,claude-sonnet-4-20250514,anthropic,count-dataset-tokens,12569,5421,17990,850.169258,False,0.0,claude-sonnet-4-20250514,count-dataset-tokens,850.169258,False,0.0,False,850.169258 +ae860e5c-7fea-4d0c-913e-dea5e3ba38c5,claude-opus-4-1-20250805,anthropic,break-filter-js-from-html,8881,7975,16856,1204.059704,True,1.0,claude-opus-4-1-20250805,break-filter-js-from-html,1204.059704,True,0.2222222222222222,True,1204.059704 +90195fc4-abd2-4ba3-8b83-4455e623e9d4,gemini-2.5-flash,gemini,crack-7z-hash,9449,5717,15166,556.26839,True,1.0,gemini-2.5-flash,crack-7z-hash,556.26839,True,0.8,True,556.26839 +2746a62c-e0ac-40e2-a840-5587149d8c57,moonshotai/Kimi-K2-Instruct-0905,together_ai,make-mips-interpreter,32658,24263,56921,1800.515873,False,0.0,moonshotai/Kimi-K2-Instruct-0905,make-mips-interpreter,1800.515873,False,0.0,False,1800.515873 +d14ba659-84d1-40f4-b2b7-50edccf6a54a,grok-4-0709,xai,sqlite-db-truncate,3138,2324,5462,798.584089,False,0.0,grok-4-0709,sqlite-db-truncate,798.584089,False,0.0,False,798.584089 
+361a1a5e-a9ed-4634-945c-c0cc72170616,deepseek-ai/DeepSeek-V3.1,together_ai,polyglot-rust-c,19024,20256,39280,923.808872,False,0.0,deepseek-ai/DeepSeek-V3.1,polyglot-rust-c,923.808872,False,0.0,False,923.808872 +80ee59a5-1ed4-4853-825d-9067fad0e72d,gpt-5,openai,dna-insert,4923,5949,10872,360.010782,False,0.0,gpt-5,dna-insert,360.010782,False,0.0,False,360.010782 +18116941-f772-4f0e-8423-902d4c1c3d5b,moonshotai/Kimi-K2-Instruct-0905,together_ai,mteb-leaderboard,5491,5164,10655,310.186324,False,0.0,moonshotai/Kimi-K2-Instruct-0905,mteb-leaderboard,310.186324,False,0.0,False,310.186324 +3069d20c-bed1-4b7b-8b71-385297a6c1ae,gpt-5,openai,cobol-modernization,5346,2869,8215,225.235422,True,1.0,gpt-5,cobol-modernization,225.235422,True,1.0,True,225.235422 +eea220be-b6c8-4983-a6ec-d57cde4fbb09,claude-sonnet-4-20250514,anthropic,write-compressor,8372,7798,16170,900.001485,False,0.0,claude-sonnet-4-20250514,write-compressor,900.001485,False,0.0,False,900.001485 +4c85aaad-6263-45ed-afdc-0df292c4a327,moonshotai/Kimi-K2-Instruct-0905,together_ai,model-extraction-relu-logits,8072,7542,15614,459.288541,True,1.0,moonshotai/Kimi-K2-Instruct-0905,model-extraction-relu-logits,459.288541,True,0.4,True,459.288541 +aa4c500f-9ac3-4d13-b2cd-d6b2a24a91ee,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,video-processing,2975,2204,5179,214.152491,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,video-processing,214.152491,False,0.0,False,214.152491 +898cac89-d695-46db-8ab4-5a67c86a074e,claude-opus-4-1-20250805,anthropic,bn-fit-modify,14181,4897,19078,312.339663,True,1.0,claude-opus-4-1-20250805,bn-fit-modify,312.339663,True,0.875,True,312.339663 +6e59ef96-22fa-41c3-baf3-b8ecaf4e9291,zai-org/GLM-4.5-Air-FP8,together_ai,qemu-startup,1297,2525,3822,900.013156,False,0.0,zai-org/GLM-4.5-Air-FP8,qemu-startup,900.013156,False,0.2,False,900.013156 
+59a52a27-3faa-4c34-a0d1-4c318ec36dee,moonshotai/Kimi-K2-Instruct-0905,together_ai,mteb-leaderboard,27273,8696,35969,2753.225711,False,0.0,moonshotai/Kimi-K2-Instruct-0905,mteb-leaderboard,2753.225711,False,0.0,False,2753.225711 +ae480f5e-5805-4eff-b63a-8e4b404112bd,moonshotai/Kimi-K2-Instruct-0905,together_ai,fix-git,4878,4061,8939,336.181738,True,1.0,moonshotai/Kimi-K2-Instruct-0905,fix-git,336.181738,True,1.0,True,336.181738 +01c15953-c7e0-404e-a07f-dae9b4ff9c2d,claude-opus-4-1-20250805,anthropic,sqlite-with-gcov,10620,1685,12305,433.157226,False,0.0,claude-opus-4-1-20250805,sqlite-with-gcov,433.157226,False,0.5714285714285714,False,433.157226 +3c0c81da-1f35-4a31-9c3c-cce417ea4545,OpenAI/gpt-oss-20B,together_ai,mteb-retrieve,1429,4966,6395,576.392569,False,0.0,OpenAI/gpt-oss-20B,mteb-retrieve,576.392569,False,0.0,False,576.392569 +bfa8feba-2a79-4350-81f7-54801cfe3ab2,openai/gpt-oss-120b,together_ai,pytorch-model-recovery,11139,8778,19917,903.385289,False,0.0,openai/gpt-oss-120b,pytorch-model-recovery,903.385289,False,0.4,False,903.385289 +686b746b-b3cf-46b7-8a7c-c2698d55cfab,grok-code-fast-1,xai,feal-differential-cryptanalysis,2474,1768,4242,148.443599,False,0.0,grok-code-fast-1,feal-differential-cryptanalysis,148.443599,False,0.0,False,148.443599 +a16bf79d-69fc-4f07-9bb9-f5bcad179bd8,grok-4-0709,xai,dna-insert,964,276,1240,361.224911,False,0.0,grok-4-0709,dna-insert,361.224911,False,0.0,False,361.224911 +2b308509-85fb-4fd3-a85b-bd75b18e481d,claude-sonnet-4-20250514,anthropic,path-tracing-reverse,7630,8696,16326,965.08116,False,0.0,claude-sonnet-4-20250514,path-tracing-reverse,965.08116,False,0.0,False,965.08116 +5ad21587-315d-4ece-894e-af0af09b3e77,gemini-2.5-flash,gemini,pypi-server,10964,4162,15126,376.132343,False,0.0,gemini-2.5-flash,pypi-server,376.132343,False,0.0,False,376.132343 
+5448cde9-71e6-415f-8499-cfc4d2fb4870,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,mteb-leaderboard,2968,2240,5208,168.491044,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,mteb-leaderboard,168.491044,False,0.0,False,168.491044 +eb81fc2c-2f30-4d57-a29c-dc09b644b08c,claude-opus-4-1-20250805,anthropic,sanitize-git-repo,12849,3735,16584,704.858849,False,0.0,claude-opus-4-1-20250805,sanitize-git-repo,704.858849,False,0.0,False,704.858849 +8ad7e586-9d2b-4290-af2e-3f0e41a6474d,zai-org/GLM-4.5-Air-FP8,together_ai,gpt2-codegolf,21876,14162,36038,900.001642,False,0.0,zai-org/GLM-4.5-Air-FP8,gpt2-codegolf,900.001642,False,0.0,False,900.001642 +7bdac175-6fbd-4f65-924c-a5e6439c6c65,openai/gpt-oss-120b,together_ai,circuit-fibsqrt,6932,18772,25704,2855.665421,False,0.0,openai/gpt-oss-120b,circuit-fibsqrt,2855.665421,False,0.0,False,2855.665421 +8fb2ad7c-7b16-4470-82fe-37bfd913d0c0,grok-code-fast-1,xai,crack-7z-hash,9142,2605,11747,307.733225,True,1.0,grok-code-fast-1,crack-7z-hash,307.733225,True,0.6,True,307.733225 +f6c10a37-d9b6-4bec-94ab-62199b043b44,gpt-5-nano,openai,large-scale-text-editing,8840,9080,17920,1203.651723,False,0.0,gpt-5-nano,large-scale-text-editing,1203.651723,False,0.0,False,1203.651723 +c1e68c21-c76a-4e73-b2ab-d8aa37fd5c83,claude-opus-4-1-20250805,anthropic,crack-7z-hash,10467,3036,13503,217.612309,False,0.0,claude-opus-4-1-20250805,crack-7z-hash,217.612309,False,0.8888888888888888,False,217.612309 +44084ffe-ea1e-43a8-a734-6dc402078c66,gemini-2.5-flash,gemini,cobol-modernization,7266,6337,13603,553.277356,True,1.0,gemini-2.5-flash,cobol-modernization,553.277356,True,0.2,True,553.277356 +f9e68490-a9b1-4bb1-bee3-e03564d23215,gemini-2.5-pro,gemini,tune-mjcf,7147,6428,13575,929.426821,False,0.0,gemini-2.5-pro,tune-mjcf,929.426821,False,0.2,False,929.426821 +a03f6da2-4b7e-491c-9a75-e32c940eb0cc,gpt-5-mini,openai,sqlite-with-gcov,5956,1727,7683,179.188808,True,1.0,gpt-5-mini,sqlite-with-gcov,179.188808,True,1.0,True,179.188808 
+67392217-1422-44be-b7a7-0bc59d5142eb,claude-opus-4-1-20250805,anthropic,train-fasttext,25237,9692,34929,2274.075464,True,1.0,claude-opus-4-1-20250805,train-fasttext,2274.075464,True,0.2857142857142857,True,2274.075464 +c28489cf-9ab3-4f4d-a0c9-518ff98323e7,gpt-5-mini,openai,reshard-c4-data,4818,4549,9367,301.946198,False,0.0,gpt-5-mini,reshard-c4-data,301.946198,False,0.0,False,301.946198 +81cd5f3d-2d04-4e32-8725-d673b504d24c,gpt-5-mini,openai,constraints-scheduling,4620,3724,8344,125.094261,True,1.0,gpt-5-mini,constraints-scheduling,125.094261,True,0.8,True,125.094261 +598a9242-7093-4737-a04a-cd53d5bec3d6,zai-org/GLM-4.5-Air-FP8,together_ai,port-compressor,42645,27973,70618,3619.726052,False,0.0,zai-org/GLM-4.5-Air-FP8,port-compressor,3619.726052,False,0.0,False,3619.726052 +cbcfc0b2-a823-4494-83fe-0902c4f62955,gemini-2.5-flash,gemini,polyglot-c-py,834,19918,20752,900.144219,False,0.0,gemini-2.5-flash,polyglot-c-py,900.144219,False,0.0,False,900.144219 +dc23566d-cd26-41f3-bbe1-27643dd3b562,claude-opus-4-1-20250805,anthropic,qemu-alpine-ssh,2123,1496,3619,289.950868,True,1.0,claude-opus-4-1-20250805,qemu-alpine-ssh,289.950868,True,0.8571428571428571,True,289.950868 +a8eeb70d-baf1-4ee5-9d4c-42cabd86063b,gemini-2.5-pro,gemini,fix-code-vulnerability,11019,4730,15749,966.169399,False,0.0,gemini-2.5-pro,fix-code-vulnerability,966.169399,False,0.2,False,966.169399 +0fd2cc0e-19f8-4c4d-b38b-c3213054f032,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,mteb-retrieve,1093,592,1685,89.418395,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,mteb-retrieve,89.418395,False,0.0,False,89.418395 +57c1989a-50ee-4c3b-bf67-13e2e5c00e26,grok-4-0709,xai,sqlite-with-gcov,3884,1953,5837,652.025607,False,0.0,grok-4-0709,sqlite-with-gcov,652.025607,False,0.0,False,652.025607 
+c11658db-3f80-4a84-afb6-562cf84011da,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sqlite-db-truncate,5393,3033,8426,267.649291,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sqlite-db-truncate,267.649291,False,0.0,False,267.649291 +2571de58-8684-42ef-a825-4b8ee35fe5d5,gpt-5-mini,openai,build-pov-ray,6646,5294,11940,1755.048156,False,0.0,gpt-5-mini,build-pov-ray,1755.048156,False,0.0,False,1755.048156 +17466622-3065-468c-8b9a-4c64fbda183b,gpt-5-mini,openai,qemu-startup,3155,1968,5123,267.37671,False,0.0,gpt-5-mini,qemu-startup,267.37671,False,0.8,False,267.37671 +62fdd083-226e-4183-bbd8-88a6f12277e6,claude-sonnet-4-20250514,anthropic,torch-tensor-parallelism,3504,2707,6211,185.69269,False,0.0,claude-sonnet-4-20250514,torch-tensor-parallelism,185.69269,False,0.0,False,185.69269 +c0073804-2144-4929-84d3-328610350b0f,gpt-5-nano,openai,merge-diff-arc-agi-task,7954,4557,12511,587.703042,False,0.0,gpt-5-nano,merge-diff-arc-agi-task,587.703042,False,0.2,False,587.703042 +3fd577a7-20de-4eaa-9c93-63dee9019e49,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,make-mips-interpreter,15360,12445,27805,1808.34095,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,make-mips-interpreter,1808.34095,False,0.0,False,1808.34095 +9e259cdf-dbfb-47c8-9766-540e0a15b510,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,pypi-server,13235,5187,18422,718.81295,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,pypi-server,718.81295,False,0.2,False,718.81295 +ff9f5194-ac5f-46b7-bec8-4931295074d3,gemini-2.5-pro,gemini,filter-js-from-html,3557,2795,6352,678.564274,False,0.0,gemini-2.5-pro,filter-js-from-html,678.564274,False,0.0,False,678.564274 +48b71008-c2b6-4017-bc13-2358365793da,OpenAI/gpt-oss-20B,together_ai,winning-avg-corewars,224,311,535,53.578473,False,0.0,OpenAI/gpt-oss-20B,winning-avg-corewars,53.578473,False,0.0,False,53.578473 
+665dc520-f100-4932-b763-60cd5f16ef59,moonshotai/Kimi-K2-Instruct-0905,together_ai,qemu-alpine-ssh,2672,4120,6792,1044.974533,False,0.0,moonshotai/Kimi-K2-Instruct-0905,qemu-alpine-ssh,1044.974533,False,0.0,False,1044.974533 +43db5e39-7beb-404e-ad93-1ceda10aa853,grok-code-fast-1,xai,pypi-server,2316,973,3289,99.855592,False,0.0,grok-code-fast-1,pypi-server,99.855592,False,0.8,False,99.855592 +f3bee811-1337-40bc-b1bc-7ed8088e56ec,grok-code-fast-1,xai,gpt2-codegolf,1206,776,1982,34.891083,False,0.0,grok-code-fast-1,gpt2-codegolf,34.891083,False,0.0,False,34.891083 +2de09c9a-22a0-49ff-9db9-61d2add03b76,gemini-2.5-pro,gemini,video-processing,3172,2421,5593,301.453438,False,0.0,gemini-2.5-pro,video-processing,301.453438,False,0.0,False,301.453438 +e83d15c2-7116-4d80-b00a-1b38b98b4200,gemini-2.5-pro,gemini,count-dataset-tokens,14245,2587,16832,904.549244,False,0.0,gemini-2.5-pro,count-dataset-tokens,904.549244,False,0.0,False,904.549244 +2ebc23fc-7ddb-41c6-832b-62bbf31be73e,OpenAI/gpt-oss-20B,together_ai,configure-git-webserver,3459,1004,4463,356.76794,False,0.0,OpenAI/gpt-oss-20B,configure-git-webserver,356.76794,False,0.2,False,356.76794 +a4418230-04b9-43c8-94f2-5705649cc023,gpt-5-mini,openai,crack-7z-hash,6116,6500,12616,900.025975,False,0.0,gpt-5-mini,crack-7z-hash,900.025975,False,0.0,False,900.025975 +1aae83f7-f423-4910-93f9-bbc66cb8a7dd,moonshotai/Kimi-K2-Instruct-0905,together_ai,nginx-request-logging,6083,3919,10002,928.656158,True,1.0,moonshotai/Kimi-K2-Instruct-0905,nginx-request-logging,928.656158,True,0.4,True,928.656158 +97275d32-d710-410c-8ca8-0a84a9b187f7,deepseek-ai/DeepSeek-V3.1,together_ai,polyglot-c-py,16590,10708,27298,900.001377,False,0.0,deepseek-ai/DeepSeek-V3.1,polyglot-c-py,900.001377,False,0.0,False,900.001377 +dd4f3027-2b94-401c-814f-e33efb8c1fc9,zai-org/GLM-4.5-Air-FP8,together_ai,write-compressor,6141,10378,16519,831.477683,False,0.0,zai-org/GLM-4.5-Air-FP8,write-compressor,831.477683,False,0.0,False,831.477683 
+2edd6578-4c27-4cb1-bd17-d334a821eeaf,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,constraints-scheduling,2301,3215,5516,163.750145,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,constraints-scheduling,163.750145,False,0.0,False,163.750145 +c5916c9e-6a5c-4039-a38b-580fe23ed69e,gpt-5-mini,openai,sanitize-git-repo,1792,5499,7291,900.597739,False,0.0,gpt-5-mini,sanitize-git-repo,900.597739,False,0.0,False,900.597739 +f652c17f-8af2-414e-8c2b-3b87c4c9fd96,gemini-2.5-flash,gemini,tune-mjcf,7429,4683,12112,608.146811,True,1.0,gemini-2.5-flash,tune-mjcf,608.146811,True,0.6,True,608.146811 +f0579349-bf5f-4ab0-9dc8-b1428c3242cb,grok-code-fast-1,xai,extract-elf,8076,4002,12078,301.160626,True,1.0,grok-code-fast-1,extract-elf,301.160626,True,0.6,True,301.160626 +1b2f8bc8-778e-4965-b0f7-fd8865be8a0d,gemini-2.5-pro,gemini,dna-insert,5544,1319,6863,368.076838,False,0.0,gemini-2.5-pro,dna-insert,368.076838,False,0.0,False,368.076838 +4e72d6df-728e-4dc0-b20c-300dc694fb78,gemini-2.5-flash,gemini,sanitize-git-repo,12322,2875,15197,233.104675,False,0.0,gemini-2.5-flash,sanitize-git-repo,233.104675,False,0.0,False,233.104675 +c160dcdd-00fc-4e0f-86f4-515c46ec29f3,gemini-2.5-pro,gemini,extract-elf,7215,1812,9027,356.41755,False,0.0,gemini-2.5-pro,extract-elf,356.41755,False,0.0,False,356.41755 +63d234a3-5e5c-4d44-b55c-891a3269df5d,zai-org/GLM-4.5-Air-FP8,together_ai,build-cython-ext,17081,4126,21207,900.006475,False,0.0,zai-org/GLM-4.5-Air-FP8,build-cython-ext,900.006475,False,0.0,False,900.006475 +62815651-ed06-4c4d-88a3-ebeab792569d,grok-4-0709,xai,sqlite-with-gcov,9752,2532,12284,697.407031,False,0.0,grok-4-0709,sqlite-with-gcov,697.407031,False,0.0,False,697.407031 +42eb86df-8898-4b17-b42c-d060dec3261c,grok-code-fast-1,xai,tune-mjcf,6446,6261,12707,707.711044,True,1.0,grok-code-fast-1,tune-mjcf,707.711044,True,0.4,True,707.711044 
+8cad6437-ceed-4123-9a83-ec4f36f5e90f,gemini-2.5-flash,gemini,sanitize-git-repo,15242,3726,18968,231.436895,False,0.0,gemini-2.5-flash,sanitize-git-repo,231.436895,False,0.0,False,231.436895 +c2979f38-57fd-4840-8a52-8f2f1fd0dcd8,zai-org/GLM-4.5-Air-FP8,together_ai,mteb-leaderboard,5024,8239,13263,398.055009,False,0.0,zai-org/GLM-4.5-Air-FP8,mteb-leaderboard,398.055009,False,0.0,False,398.055009 +2c9e6ad1-f533-426b-a6fd-932ca3c937f1,zai-org/GLM-4.5-Air-FP8,together_ai,constraints-scheduling,9760,8863,18623,400.99791,False,0.0,zai-org/GLM-4.5-Air-FP8,constraints-scheduling,400.99791,False,0.8,False,400.99791 +10aaf009-27a2-4b61-9eb8-c1516b7b8bf0,grok-code-fast-1,xai,train-fasttext,11734,4440,16174,1162.404317,False,0.0,grok-code-fast-1,train-fasttext,1162.404317,False,0.0,False,1162.404317 +02f46f7e-0aba-4caf-a7f4-c34fb818c903,claude-opus-4-1-20250805,anthropic,vulnerable-secret,5802,4670,10472,418.521487,True,1.0,claude-opus-4-1-20250805,vulnerable-secret,418.521487,True,0.625,True,418.521487 +92e85f30-8eca-4068-8444-d23552bc115d,grok-code-fast-1,xai,adaptive-rejection-sampler,10298,4303,14601,283.63497,False,0.0,grok-code-fast-1,adaptive-rejection-sampler,283.63497,False,0.0,False,283.63497 +9f8db136-602e-4c03-9175-61a967263e50,gpt-5,openai,pypi-server,3050,1566,4616,182.954646,True,1.0,gpt-5,pypi-server,182.954646,True,0.3333333333333333,True,182.954646 +ad4f1c3e-1869-48f7-87f0-9886d79df776,gpt-5-mini,openai,regex-log,1699,1371,3070,163.535429,True,1.0,gpt-5-mini,regex-log,163.535429,True,0.8,True,163.535429 +44489547-cc5c-4603-92da-ea05b00d257c,claude-opus-4-1-20250805,anthropic,large-scale-text-editing,7392,8601,15993,535.524466,True,1.0,claude-opus-4-1-20250805,large-scale-text-editing,535.524466,True,0.6666666666666666,True,535.524466 +5156ccac-113d-4a64-8dcd-bb3153ab89b5,OpenAI/gpt-oss-20B,together_ai,crack-7z-hash,1043,267,1310,24.209075,False,0.0,OpenAI/gpt-oss-20B,crack-7z-hash,24.209075,False,0.0,False,24.209075 
+d593c474-e661-4e82-b792-3f9d10ba32e7,gpt-5-nano,openai,password-recovery,2369,4387,6756,913.197578,False,0.0,gpt-5-nano,password-recovery,913.197578,False,0.0,False,913.197578 +61fadb13-c0d8-4c67-a51e-0748db8deb9c,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,polyglot-rust-c,3609,2711,6320,209.510837,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,polyglot-rust-c,209.510837,False,0.0,False,209.510837 +790e2529-d424-46a6-947b-5d207053c57b,OpenAI/gpt-oss-20B,together_ai,circuit-fibsqrt,5766,19115,24881,2432.870014,False,0.0,OpenAI/gpt-oss-20B,circuit-fibsqrt,2432.870014,False,0.0,False,2432.870014 +182654d0-a890-44f5-a277-3fc3ec0e945b,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,wasm-pipeline,2763,1815,4578,108.523803,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,wasm-pipeline,108.523803,False,0.0,False,108.523803 +30ea6998-7bf6-4c27-a0f3-820a80c5acf7,deepseek-ai/DeepSeek-V3.1,together_ai,polyglot-rust-c,13351,12696,26047,883.643068,False,0.0,deepseek-ai/DeepSeek-V3.1,polyglot-rust-c,883.643068,False,0.0,False,883.643068 +8f7b2626-e5bd-46e6-9a86-ac5425a89f9a,gemini-2.5-pro,gemini,polyglot-c-py,1691,1374,3065,151.89027,False,0.0,gemini-2.5-pro,polyglot-c-py,151.89027,False,0.2,False,151.89027 +d824c6a6-bce5-4eb8-a196-6c4acb3c226a,gpt-5-mini,openai,path-tracing-reverse,5918,1528,7446,127.758521,False,0.0,gpt-5-mini,path-tracing-reverse,127.758521,False,0.0,False,127.758521 +bdf9e342-ef02-49a6-8e19-f86caf176a0b,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,password-recovery,2865,2370,5235,196.82905,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,password-recovery,196.82905,False,0.0,False,196.82905 +e202023c-29a7-4e16-b0c4-1e18ec6cbd91,deepseek-ai/DeepSeek-V3.1,together_ai,sparql-university,4993,2084,7077,188.5622,False,0.0,deepseek-ai/DeepSeek-V3.1,sparql-university,188.5622,False,0.0,False,188.5622 
+7f64cd27-88f1-428a-b0f3-c6384f56e87b,claude-sonnet-4-20250514,anthropic,nginx-request-logging,4533,3227,7760,491.848489,True,1.0,claude-sonnet-4-20250514,nginx-request-logging,491.848489,True,1.0,True,491.848489 +b6ed6150-7d59-401d-9c59-d2d400d23ab2,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,db-wal-recovery,2575,1798,4373,414.862851,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,db-wal-recovery,414.862851,False,0.0,False,414.862851 +5e91e6d4-f503-43f3-8689-d04f56832f19,grok-4-0709,xai,model-extraction-relu-logits,1172,1368,2540,900.119196,False,0.0,grok-4-0709,model-extraction-relu-logits,900.119196,False,0.0,False,900.119196 +4a54a613-a835-4723-84ea-dc8e3ee54a66,gemini-2.5-pro,gemini,crack-7z-hash,12359,5921,18280,904.810536,False,0.0,gemini-2.5-pro,crack-7z-hash,904.810536,False,0.8,False,904.810536 +0148ddbb-9c20-4c80-bd8a-fef94dd3bb3f,zai-org/GLM-4.5-Air-FP8,together_ai,reverse-engineering,17222,15042,32264,1800.102118,False,0.0,zai-org/GLM-4.5-Air-FP8,reverse-engineering,1800.102118,False,0.0,False,1800.102118 +c0ea14c1-d2f2-4cb3-bf51-1ee91c6dd330,gemini-2.5-flash,gemini,crack-7z-hash,8968,4396,13364,327.482622,True,1.0,gemini-2.5-flash,crack-7z-hash,327.482622,True,0.8,True,327.482622 +d5bfd68d-bb07-4ac4-aa84-5db9e85c0885,OpenAI/gpt-oss-20B,together_ai,openssl-selfsigned-cert,2050,1218,3268,76.609029,False,0.0,OpenAI/gpt-oss-20B,openssl-selfsigned-cert,76.609029,False,0.2,False,76.609029 +91e7e2f5-9bff-4120-b8ad-287df4753714,gpt-5,openai,db-wal-recovery,7575,7224,14799,903.651288,False,0.0,gpt-5,db-wal-recovery,903.651288,False,0.1428571428571428,False,903.651288 +aa4326ef-b6a7-4884-ab0d-f40bfaddb2d7,claude-sonnet-4-20250514,anthropic,sanitize-git-repo,15573,6498,22071,784.537945,False,0.0,claude-sonnet-4-20250514,sanitize-git-repo,784.537945,False,0.0,False,784.537945 
+47ac79e5-9e41-4f58-8750-d1c8f2502dec,grok-code-fast-1,xai,sanitize-git-repo,2797,1869,4666,93.022018,False,0.0,grok-code-fast-1,sanitize-git-repo,93.022018,False,0.0,False,93.022018 +ebcc6278-5a5a-44bb-9781-6921c6f38b29,claude-opus-4-1-20250805,anthropic,path-tracing-reverse,33234,23016,56250,1800.032101,False,0.0,claude-opus-4-1-20250805,path-tracing-reverse,1800.032101,False,0.0,False,1800.032101 +c35e2e8f-9cfc-43f0-8015-5da494476702,deepseek-ai/DeepSeek-V3.1,together_ai,chess-best-move,10545,5337,15882,888.240521,False,0.0,deepseek-ai/DeepSeek-V3.1,chess-best-move,888.240521,False,0.0,False,888.240521 +4c2f3126-31c8-4171-93c4-9751e7c410a8,gemini-2.5-pro,gemini,reshard-c4-data,6064,4218,10282,554.952568,False,0.0,gemini-2.5-pro,reshard-c4-data,554.952568,False,0.0,False,554.952568 +b120f3bf-a8ca-4024-9e62-64e5d9e28946,gpt-5,openai,hf-model-inference,4015,1635,5650,312.829563,True,1.0,gpt-5,hf-model-inference,312.829563,True,1.0,True,312.829563 +2decb33d-6acf-44cb-8ab8-12e8905f8e56,claude-opus-4-1-20250805,anthropic,sqlite-db-truncate,9145,5907,15052,205.694099,False,0.0,claude-opus-4-1-20250805,sqlite-db-truncate,205.694099,False,0.125,False,205.694099 +65b0dcb8-abb9-4d90-8d84-9cee6791cfe5,deepseek-ai/DeepSeek-V3.1,together_ai,fix-code-vulnerability,15128,6822,21950,541.276845,True,1.0,deepseek-ai/DeepSeek-V3.1,fix-code-vulnerability,541.276845,True,0.2,True,541.276845 +1cd8ad5e-b8a6-4758-8387-ff734e24ed01,gpt-5-nano,openai,cobol-modernization,13241,15325,28566,900.012195,True,1.0,gpt-5-nano,cobol-modernization,900.012195,True,0.4,True,900.012195 +39b89f45-4be4-4f58-976a-004c9eeb02f3,OpenAI/gpt-oss-20B,together_ai,reverse-engineering,1485,2145,3630,343.11882,False,0.0,OpenAI/gpt-oss-20B,reverse-engineering,343.11882,False,0.0,False,343.11882 +5b5bac83-1493-4690-b0c2-b0fa909b3f93,claude-sonnet-4-20250514,anthropic,large-scale-text-editing,2878,2194,5072,222.134031,True,1.0,claude-sonnet-4-20250514,large-scale-text-editing,222.134031,True,0.6,True,222.134031 
+55bfe684-05df-4cfd-b629-4a699cc0d931,openai/gpt-oss-120b,together_ai,count-dataset-tokens,1416,1186,2602,189.466334,False,0.0,openai/gpt-oss-120b,count-dataset-tokens,189.466334,False,0.0,False,189.466334 +1030e132-a2cc-4bde-b03e-ea3d8d6ee380,gpt-5-mini,openai,make-doom-for-mips,12573,9482,22055,902.864994,False,0.0,gpt-5-mini,make-doom-for-mips,902.864994,False,0.0,False,902.864994 +c45a7639-2529-4821-874e-f8736b1d4bd5,grok-4-0709,xai,feal-linear-cryptanalysis,3600,994,4594,1801.016086,False,0.0,grok-4-0709,feal-linear-cryptanalysis,1801.016086,False,0.0,False,1801.016086 +802f94ac-5233-475f-af91-e7ca67833fd4,grok-code-fast-1,xai,mteb-retrieve,1635,623,2258,80.889906,False,0.0,grok-code-fast-1,mteb-retrieve,80.889906,False,0.0,False,80.889906 +83591efe-5a9e-4f61-811c-521af2c39eac,grok-4-0709,xai,fix-ocaml-gc,16482,5318,21800,3697.597806,False,0.0,grok-4-0709,fix-ocaml-gc,3697.597806,False,0.0,False,3697.597806 +de14bcba-3abd-4a85-9015-5f558009014b,gemini-2.5-flash,gemini,make-mips-interpreter,6505,13662,20167,1800.612837,False,0.0,gemini-2.5-flash,make-mips-interpreter,1800.612837,False,0.0,False,1800.612837 +ebf4450e-6699-45ff-a837-a4ecb300cf9b,grok-4-0709,xai,feal-linear-cryptanalysis,16296,6683,22979,1814.053289,False,0.0,grok-4-0709,feal-linear-cryptanalysis,1814.053289,False,0.0,False,1814.053289 +d59d5a20-f553-4305-b7ae-09fca34aa8c8,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,mteb-retrieve,14922,4770,19692,692.044962,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,mteb-retrieve,692.044962,False,0.0,False,692.044962 +d0854df0-1c07-4d90-bb05-55c256631343,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,polyglot-c-py,6220,2773,8993,117.323132,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,polyglot-c-py,117.323132,False,0.0,False,117.323132 
+65dc8e91-4011-4262-81ff-276fa36d6d43,claude-opus-4-1-20250805,anthropic,path-tracing,10906,9052,19958,977.47282,False,0.0,claude-opus-4-1-20250805,path-tracing,977.47282,False,0.0,False,977.47282 +4c591c36-a783-4cac-bec6-27deca072d9f,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,qemu-alpine-ssh,2307,2377,4684,1042.147924,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,qemu-alpine-ssh,1042.147924,False,0.2,False,1042.147924 +2f141cf1-85a6-4582-a4cf-1b8d7e98a967,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,run-pdp11-code,1712,1154,2866,1064.575988,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,run-pdp11-code,1064.575988,False,0.0,False,1064.575988 +ea493867-f535-4e01-bf8c-9778da51c90d,gemini-2.5-pro,gemini,build-cython-ext,13411,4750,18161,930.140354,False,0.0,gemini-2.5-pro,build-cython-ext,930.140354,False,0.0,False,930.140354 +3a29b6e7-1db4-4554-b6c0-99d82106a63f,moonshotai/Kimi-K2-Instruct-0905,together_ai,cobol-modernization,8884,7082,15966,900.016399,False,0.0,moonshotai/Kimi-K2-Instruct-0905,cobol-modernization,900.016399,False,0.6,False,900.016399 +086eee7f-9cf0-4ed2-a5ff-7e543c73a31f,gpt-5-mini,openai,bn-fit-modify,10414,6077,16491,596.082064,True,1.0,gpt-5-mini,bn-fit-modify,596.082064,True,0.6,True,596.082064 +9de18010-b7ef-4297-9314-0394eff7277e,OpenAI/gpt-oss-20B,together_ai,path-tracing,7114,23993,31107,1823.319191,False,0.0,OpenAI/gpt-oss-20B,path-tracing,1823.319191,False,0.0,False,1823.319191 +c1c5b36c-b26f-40fa-9537-95af9172895a,gpt-5,openai,merge-diff-arc-agi-task,7862,4486,12348,443.221105,True,1.0,gpt-5,merge-diff-arc-agi-task,443.221105,True,1.0,True,443.221105 +5538baed-4a30-4d58-912c-42fdf6c3cd1d,gemini-2.5-pro,gemini,qemu-startup,1192,804,1996,198.950849,False,0.0,gemini-2.5-pro,qemu-startup,198.950849,False,0.2,False,198.950849 +74c86c47-f47a-495e-b6a3-8eb1cc86fd50,gpt-5-mini,openai,git-leak-recovery,4236,4538,8774,901.421608,False,0.0,gpt-5-mini,git-leak-recovery,901.421608,False,0.0,False,901.421608 
+2285b1a1-3b56-4727-a8c2-5bb7cea85005,zai-org/GLM-4.5-Air-FP8,together_ai,run-pdp11-code,12804,13798,26602,644.675568,False,0.0,zai-org/GLM-4.5-Air-FP8,run-pdp11-code,644.675568,False,0.0,False,644.675568 +0d0edd5d-051e-4539-9cc1-416a7ff82abb,gpt-5-mini,openai,db-wal-recovery,12242,10574,22816,488.102633,False,0.0,gpt-5-mini,db-wal-recovery,488.102633,False,0.0,False,488.102633 +3419b2e9-3ed1-4023-a468-6727a860e5c1,gpt-5-nano,openai,make-mips-interpreter,15345,10772,26117,1804.836996,False,0.0,gpt-5-nano,make-mips-interpreter,1804.836996,False,0.0,False,1804.836996 +ea2a6674-e248-495d-b33a-324116f6a87f,openai/gpt-oss-120b,together_ai,large-scale-text-editing,2407,1802,4209,169.447121,False,0.0,openai/gpt-oss-120b,large-scale-text-editing,169.447121,False,0.0,False,169.447121 +6e2c0a75-16bd-4296-bc9c-5610f0581d7f,deepseek-ai/DeepSeek-V3.1,together_ai,write-compressor,6114,6854,12968,917.610836,False,0.0,deepseek-ai/DeepSeek-V3.1,write-compressor,917.610836,False,0.0,False,917.610836 +8aa1f7e6-dbb8-4c35-87dc-7e2d63266444,claude-sonnet-4-20250514,anthropic,financial-document-processor,18596,11113,29709,1027.384662,False,0.0,claude-sonnet-4-20250514,financial-document-processor,1027.384662,False,0.2,False,1027.384662 +fda7af6e-37d3-4539-8f51-08e0aa759d01,openai/gpt-oss-120b,together_ai,schemelike-metacircular-eval,5896,2631,8527,96.662482,False,0.0,openai/gpt-oss-120b,schemelike-metacircular-eval,96.662482,False,0.0,False,96.662482 +01e7ea3d-e15d-44fd-a84d-1d33afeef2f6,gemini-2.5-pro,gemini,password-recovery,5277,4947,10224,901.07837,False,0.0,gemini-2.5-pro,password-recovery,901.07837,False,0.0,False,901.07837 +6448dab5-d962-4835-9f21-2ebf832e1c68,gemini-2.5-pro,gemini,reverse-engineering,15795,10082,25877,1806.484505,False,0.0,gemini-2.5-pro,reverse-engineering,1806.484505,False,0.0,False,1806.484505 +5b89640d-4b7e-4772-b805-39d81caa017e,gpt-5,openai,polyglot-rust-c,1553,1709,3262,900.007167,False,0.0,gpt-5,polyglot-rust-c,900.007167,False,0.0,False,900.007167 
+a037118f-0681-4c65-a731-72bd3e2159ca,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,form-filling,6481,3871,10352,249.79161,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,form-filling,249.79161,False,0.0,False,249.79161 +865ec16e-2043-40be-ba01-02077e6f2043,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,constraints-scheduling,8338,12285,20623,1129.035961,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,constraints-scheduling,1129.035961,True,1.0,True,1129.035961 +1a723b17-4731-4f68-bd20-c1789dabf8ea,grok-4-0709,xai,pytorch-model-recovery,4566,2931,7497,903.574306,False,0.0,grok-4-0709,pytorch-model-recovery,903.574306,False,0.2,False,903.574306 +1bb8f992-8194-41e7-9883-fb16c90a7b22,zai-org/GLM-4.5-Air-FP8,together_ai,password-recovery,7099,5891,12990,702.088208,False,0.0,zai-org/GLM-4.5-Air-FP8,password-recovery,702.088208,False,0.0,False,702.088208 +4b1fd819-805b-43c9-9afe-8ac46704b634,claude-opus-4-1-20250805,anthropic,fix-code-vulnerability,15666,5669,21335,980.795787,False,0.0,claude-opus-4-1-20250805,fix-code-vulnerability,980.795787,False,0.125,False,980.795787 +3024e72e-2c78-48bc-aa7a-8da2915a1b92,claude-opus-4-1-20250805,anthropic,adaptive-rejection-sampler,13766,10571,24337,906.380667,False,0.0,claude-opus-4-1-20250805,adaptive-rejection-sampler,906.380667,False,0.125,False,906.380667 +695f2f2e-32dc-4362-aaa2-474e703e8615,deepseek-ai/DeepSeek-V3.1,together_ai,qemu-alpine-ssh,3804,6456,10260,903.293499,False,0.0,deepseek-ai/DeepSeek-V3.1,qemu-alpine-ssh,903.293499,False,0.2,False,903.293499 +31481f3f-1733-40df-9020-3bed9c3f3bda,grok-4-0709,xai,winning-avg-corewars,4216,1846,6062,713.651057,False,0.0,grok-4-0709,winning-avg-corewars,713.651057,False,0.0,False,713.651057 +196c9b7a-0588-4921-906f-2f3b13dc9920,moonshotai/Kimi-K2-Instruct-0905,together_ai,fix-code-vulnerability,18626,9582,28208,592.381116,False,0.0,moonshotai/Kimi-K2-Instruct-0905,fix-code-vulnerability,592.381116,False,0.0,False,592.381116 
+30f4fee6-65ac-45c8-aae0-14db8e776602,grok-code-fast-1,xai,db-wal-recovery,4682,4263,8945,511.038757,False,0.0,grok-code-fast-1,db-wal-recovery,511.038757,False,0.0,False,511.038757 +6f7e81f4-2106-46ce-a146-1117b652b5b9,gpt-5-nano,openai,install-klee-minimal,5251,3371,8622,906.13521,False,0.0,gpt-5-nano,install-klee-minimal,906.13521,False,0.0,False,906.13521 +a3c98cf9-d56b-4fbc-9a8c-a8cfdb840c44,gpt-5,openai,db-wal-recovery,11701,13205,24906,900.001769,False,0.0,gpt-5,db-wal-recovery,900.001769,False,0.1428571428571428,False,900.001769 +fc2416d9-465b-445d-aa6d-960f885722e8,zai-org/GLM-4.5-Air-FP8,together_ai,feal-linear-cryptanalysis,23837,33532,57369,1260.432391,False,0.0,zai-org/GLM-4.5-Air-FP8,feal-linear-cryptanalysis,1260.432391,False,0.0,False,1260.432391 +126dcbb7-324d-4173-9e3c-26705b83baaa,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,count-dataset-tokens,7587,1633,9220,177.997661,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,count-dataset-tokens,177.997661,False,0.0,False,177.997661 +cd448acc-9fd1-456c-9528-3869a2eeb6e0,gemini-2.5-pro,gemini,train-fasttext,15925,5735,21660,3601.220383,False,0.0,gemini-2.5-pro,train-fasttext,3601.220383,False,0.0,False,3601.220383 +5ba4a7ec-fb21-42bb-8ad6-ab6fc457ad14,gemini-2.5-pro,gemini,pytorch-model-recovery,6408,3483,9891,303.492384,True,1.0,gemini-2.5-pro,pytorch-model-recovery,303.492384,True,1.0,True,303.492384 +25041241-7c70-4d3b-88df-9a4fd0b2f253,grok-code-fast-1,xai,qemu-startup,1022,817,1839,110.70126,False,0.0,grok-code-fast-1,qemu-startup,110.70126,False,0.0,False,110.70126 +8cdf973c-ce6d-41a8-8b6e-f61b8a5607fd,gpt-5,openai,constraints-scheduling,4832,4234,9066,174.712709,False,0.0,gpt-5,constraints-scheduling,174.712709,False,0.8571428571428571,False,174.712709 +87f22486-c143-4c00-b7a1-1ef07f5d4862,deepseek-ai/DeepSeek-V3.1,together_ai,polyglot-c-py,2378,2066,4444,989.25217,False,0.0,deepseek-ai/DeepSeek-V3.1,polyglot-c-py,989.25217,False,0.0,False,989.25217 
+46075612-92dd-4445-b27b-76dd2711cbdc,claude-sonnet-4-20250514,anthropic,pytorch-model-recovery,8074,5555,13629,901.875033,True,1.0,claude-sonnet-4-20250514,pytorch-model-recovery,901.875033,True,1.0,True,901.875033 +7c3c447d-b445-4dc5-8b66-411e925dd48f,deepseek-ai/DeepSeek-V3.1,together_ai,mteb-leaderboard,3117,1841,4958,177.014717,False,0.0,deepseek-ai/DeepSeek-V3.1,mteb-leaderboard,177.014717,False,0.0,False,177.014717 +b42b8e90-2dd3-412e-8d4b-452f43d9cd23,gpt-5-nano,openai,sparql-university,15415,10085,25500,908.425454,False,0.0,gpt-5-nano,sparql-university,908.425454,False,0.0,False,908.425454 +a4907b05-ef73-49ab-9f37-4937ad5de09c,gpt-5-mini,openai,bn-fit-modify,11337,11817,23154,458.541134,True,1.0,gpt-5-mini,bn-fit-modify,458.541134,True,0.6,True,458.541134 +e9996573-f61f-4367-ac8f-bf03cbd6f27e,gpt-5-nano,openai,pytorch-model-recovery,10502,10001,20503,900.822114,False,0.0,gpt-5-nano,pytorch-model-recovery,900.822114,False,0.0,False,900.822114 +4c6df88d-e11b-4190-9d5e-9a05ff440c20,openai/gpt-oss-120b,together_ai,reshard-c4-data,3321,2585,5906,163.610161,False,0.0,openai/gpt-oss-120b,reshard-c4-data,163.610161,False,0.0,False,163.610161 +9a968ce0-e84e-4f35-a35b-6dea268270fc,zai-org/GLM-4.5-Air-FP8,together_ai,pypi-server,10035,4238,14273,900.026183,False,0.0,zai-org/GLM-4.5-Air-FP8,pypi-server,900.026183,False,0.2,False,900.026183 +1f0839c9-5660-4b3b-8d7f-c9a033e50aec,claude-opus-4-1-20250805,anthropic,count-dataset-tokens,13466,3071,16537,175.192597,False,0.0,claude-opus-4-1-20250805,count-dataset-tokens,175.192597,False,0.0,False,175.192597 +56cc63ee-de99-477c-99ef-545b42f6be54,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,mteb-retrieve,2474,1371,3845,118.603113,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,mteb-retrieve,118.603113,False,0.0,False,118.603113 +b1b73a7c-6385-4a4c-89bd-70fdba0eda5f,gpt-5-mini,openai,break-filter-js-from-html,2655,1643,4298,334.171093,False,0.0,gpt-5-mini,break-filter-js-from-html,334.171093,False,0.0,False,334.171093 
+cbf27075-def5-4941-83f2-c5d72d4a3357,deepseek-ai/DeepSeek-V3.1,together_ai,schemelike-metacircular-eval,17215,12706,29921,2452.70064,False,0.0,deepseek-ai/DeepSeek-V3.1,schemelike-metacircular-eval,2452.70064,False,0.0,False,2452.70064 +52705aba-dec6-4cae-8008-119f574f53d3,moonshotai/Kimi-K2-Instruct-0905,together_ai,feal-differential-cryptanalysis,22209,21382,43591,1818.796497,False,0.0,moonshotai/Kimi-K2-Instruct-0905,feal-differential-cryptanalysis,1818.796497,False,0.0,False,1818.796497 +73adb208-b1e7-4021-b87a-e97fb65d926b,gemini-2.5-pro,gemini,break-filter-js-from-html,4867,5974,10841,1206.644112,False,0.0,gemini-2.5-pro,break-filter-js-from-html,1206.644112,False,0.2,False,1206.644112 +d8feae3f-17d0-4624-8fd9-36ef162a809e,grok-4-0709,xai,constraints-scheduling,3291,1260,4551,483.826994,True,1.0,grok-4-0709,constraints-scheduling,483.826994,True,0.8,True,483.826994 +b6be878c-b1ce-4536-9327-b321767ea855,grok-4-0709,xai,make-mips-interpreter,16256,19424,35680,2057.934995,False,0.0,grok-4-0709,make-mips-interpreter,2057.934995,False,0.0,False,2057.934995 +0e55ca86-932f-43b9-ad0b-00f1030783d1,deepseek-ai/DeepSeek-V3.1,together_ai,sqlite-with-gcov,10791,2277,13068,170.473386,True,1.0,deepseek-ai/DeepSeek-V3.1,sqlite-with-gcov,170.473386,True,0.8,True,170.473386 +bd2b3632-1ec9-4cef-87c6-b88e2d37e711,claude-opus-4-1-20250805,anthropic,build-pmars,10259,2865,13124,600.126326,False,0.0,claude-opus-4-1-20250805,build-pmars,600.126326,False,0.5,False,600.126326 +a588cf8c-0309-462a-9867-e86db0eda599,grok-4-0709,xai,filter-js-from-html,1305,1593,2898,409.077527,False,0.0,grok-4-0709,filter-js-from-html,409.077527,False,0.0,False,409.077527 +ba5ef0d0-e8f9-4a83-85ff-aade6ba0db51,gemini-2.5-flash,gemini,feal-differential-cryptanalysis,2666,24336,27002,290.39154,False,0.0,gemini-2.5-flash,feal-differential-cryptanalysis,290.39154,False,0.2,False,290.39154 
+f1f5dcc5-d51f-4329-a76f-96a55c9e3015,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,bn-fit-modify,41610,15322,56932,3600.457142,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,bn-fit-modify,3600.457142,False,0.0,False,3600.457142 +3fb7cd02-0166-4f4a-bd68-e2fbf9807944,gpt-5-mini,openai,build-pov-ray,12579,41312,53891,6000.014509,False,0.0,gpt-5-mini,build-pov-ray,6000.014509,False,0.0,False,6000.014509 +0af79210-dbc6-4ee7-a82a-a5dcea7a7c45,gpt-5,openai,pypi-server,4249,1827,6076,183.053019,False,0.0,gpt-5,pypi-server,183.053019,False,0.3333333333333333,False,183.053019 +b7afad3d-dd86-4ed6-b18a-414d587b9270,claude-opus-4-1-20250805,anthropic,mteb-retrieve,2196,1529,3725,388.133686,False,0.0,claude-opus-4-1-20250805,mteb-retrieve,388.133686,False,0.0,False,388.133686 +422e1882-413a-4e65-b8e1-81fd9ac2859c,gpt-5,openai,bn-fit-modify,12191,12249,24440,1151.545079,False,0.0,gpt-5,bn-fit-modify,1151.545079,False,0.5,False,1151.545079 +d9ff0f91-4bd3-4746-bf1e-e9f733eea15b,grok-code-fast-1,xai,db-wal-recovery,3461,3795,7256,490.638608,False,0.0,grok-code-fast-1,db-wal-recovery,490.638608,False,0.0,False,490.638608 +c5ca9c96-de52-4df6-8361-616a2058f7a0,gpt-5,openai,model-extraction-relu-logits,6580,5283,11863,316.262251,False,0.0,gpt-5,model-extraction-relu-logits,316.262251,False,0.1666666666666666,False,316.262251 +302db4c2-6813-490a-9546-a2cb644b3cc7,gemini-2.5-flash,gemini,feal-linear-cryptanalysis,11439,28211,39650,1800.879325,False,0.0,gemini-2.5-flash,feal-linear-cryptanalysis,1800.879325,False,0.0,False,1800.879325 +d5e5a5fe-4d0c-4a57-bc27-01c1f63e65bb,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,hf-model-inference,4416,2193,6609,178.737748,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,hf-model-inference,178.737748,False,0.8,False,178.737748 
+734e9b56-2e9d-4c27-9af3-318675ed0f80,claude-sonnet-4-20250514,anthropic,financial-document-processor,5429,4186,9615,1230.753223,False,0.0,claude-sonnet-4-20250514,financial-document-processor,1230.753223,False,0.2,False,1230.753223 +4028c47b-3410-4e57-83d1-4af1ff19dccc,deepseek-ai/DeepSeek-V3.1,together_ai,path-tracing,5066,5066,10132,1031.468274,False,0.0,deepseek-ai/DeepSeek-V3.1,path-tracing,1031.468274,False,0.0,False,1031.468274 +3b2d1976-9460-496c-a928-0049485853db,claude-opus-4-1-20250805,anthropic,install-windows-3.11,11406,13494,24900,3645.10536,False,0.0,claude-opus-4-1-20250805,install-windows-3.11,3645.10536,False,0.0,False,3645.10536 +d99ac1e3-8197-4b2e-9f6e-6e1054dc5490,deepseek-ai/DeepSeek-V3.1,together_ai,adaptive-rejection-sampler,12582,11156,23738,909.159333,False,0.0,deepseek-ai/DeepSeek-V3.1,adaptive-rejection-sampler,909.159333,False,0.2,False,909.159333 +2da8398c-fb0c-4380-bf10-200891b839b1,openai/gpt-oss-120b,together_ai,chess-best-move,9531,5808,15339,805.521973,False,0.0,openai/gpt-oss-120b,chess-best-move,805.521973,False,0.0,False,805.521973 +72545f41-4ed1-423b-86b1-e54954e7c83a,grok-4-0709,xai,large-scale-text-editing,1711,866,2577,341.078518,True,1.0,grok-4-0709,large-scale-text-editing,341.078518,True,0.4,True,341.078518 +5c84767c-a92b-4372-96f7-214d4101cb79,gpt-5-mini,openai,pytorch-model-cli,1580,1525,3105,178.311842,False,0.0,gpt-5-mini,pytorch-model-cli,178.311842,False,0.0,False,178.311842 +86039e9d-c8a4-4d01-b5a0-09f5cb93f03a,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,polyglot-c-py,7854,5653,13507,910.368116,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,polyglot-c-py,910.368116,False,0.0,False,910.368116 +02ebafac-a700-42de-a694-c404cc486503,openai/gpt-oss-120b,together_ai,train-fasttext,22257,12675,34932,3601.413439,False,0.0,openai/gpt-oss-120b,train-fasttext,3601.413439,False,0.0,False,3601.413439 
+cba087b9-c691-428c-bb32-5aa41cb92bfb,claude-opus-4-1-20250805,anthropic,port-compressor,55728,36577,92305,3600.001374,False,0.0,claude-opus-4-1-20250805,port-compressor,3600.001374,False,0.0,False,3600.001374 +2adabc36-17a7-42b8-903f-ca3a71fd34bf,moonshotai/Kimi-K2-Instruct-0905,together_ai,polyglot-c-py,21194,16776,37970,904.145887,False,0.0,moonshotai/Kimi-K2-Instruct-0905,polyglot-c-py,904.145887,False,0.0,False,904.145887 +746adf2b-cdb4-4707-87c7-4414b106809f,claude-sonnet-4-20250514,anthropic,largest-eigenval,10130,8399,18529,846.486256,False,0.0,claude-sonnet-4-20250514,largest-eigenval,846.486256,False,0.0,False,846.486256 +2a273648-a6f4-41dc-bc0c-52077b1c0f78,deepseek-ai/DeepSeek-V3.1,together_ai,adaptive-rejection-sampler,13228,7352,20580,900.006481,True,1.0,deepseek-ai/DeepSeek-V3.1,adaptive-rejection-sampler,900.006481,True,0.2,True,900.006481 +5083f31c-15fc-4147-99e1-0b02bd57079d,OpenAI/gpt-oss-20B,together_ai,openssl-selfsigned-cert,1859,1163,3022,53.614372,False,0.0,OpenAI/gpt-oss-20B,openssl-selfsigned-cert,53.614372,False,0.2,False,53.614372 +97f8c84c-cef9-46e9-9ddb-95d815169c38,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,extract-elf,5199,1634,6833,242.698079,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,extract-elf,242.698079,False,0.0,False,242.698079 +c938f063-6418-4386-88ff-f6cd39264402,claude-sonnet-4-20250514,anthropic,wasm-pipeline,12230,4930,17160,408.234483,True,1.0,claude-sonnet-4-20250514,wasm-pipeline,408.234483,True,0.6,True,408.234483 +2712bc11-7a50-4d3a-b1d8-32791b653c89,zai-org/GLM-4.5-Air-FP8,together_ai,prove-plus-comm,4845,7107,11952,712.82138,True,1.0,zai-org/GLM-4.5-Air-FP8,prove-plus-comm,712.82138,True,0.8,True,712.82138 +9ac5dae9-28fe-4097-a195-b100e6eeff70,gpt-5-nano,openai,feal-linear-cryptanalysis,26243,38300,64543,1814.425211,False,0.0,gpt-5-nano,feal-linear-cryptanalysis,1814.425211,False,0.0,False,1814.425211 
+e32e39ef-8b5f-44f0-a7c7-b3909cb7dde8,gemini-2.5-flash,gemini,log-summary-date-ranges,6698,3052,9750,210.464959,False,0.0,gemini-2.5-flash,log-summary-date-ranges,210.464959,False,0.0,False,210.464959 +f77f28fb-a961-40c6-8b27-8f86b2401dc3,moonshotai/Kimi-K2-Instruct-0905,together_ai,crack-7z-hash,9109,3496,12605,309.726764,True,1.0,moonshotai/Kimi-K2-Instruct-0905,crack-7z-hash,309.726764,True,1.0,True,309.726764 +3bef001b-8719-4e2b-bdab-3d73d3557b26,grok-4-0709,xai,build-pov-ray,22223,7529,29752,2279.359497,True,1.0,grok-4-0709,build-pov-ray,2279.359497,True,1.0,True,2279.359497 +54892a94-1dbb-489e-9334-0b5731df9907,zai-org/GLM-4.5-Air-FP8,together_ai,model-extraction-relu-logits,12851,9126,21977,505.36828,False,0.0,zai-org/GLM-4.5-Air-FP8,model-extraction-relu-logits,505.36828,False,0.2,False,505.36828 +5945d0c2-36de-4049-9a35-b2b880dbc9d1,grok-4-0709,xai,qemu-alpine-ssh,1796,1709,3505,557.619939,False,0.0,grok-4-0709,qemu-alpine-ssh,557.619939,False,0.0,False,557.619939 +6b36c97b-3559-4a3e-970e-5956fc28f34c,grok-4-0709,xai,regex-log,1238,508,1746,267.028883,True,1.0,grok-4-0709,regex-log,267.028883,True,0.6,True,267.028883 +9868a0db-11cd-4002-86ba-816516162219,gpt-5,openai,model-extraction-relu-logits,11881,6505,18386,777.806328,False,0.0,gpt-5,model-extraction-relu-logits,777.806328,False,0.1666666666666666,False,777.806328 +dae4de34-7533-4679-a3ac-ffe6810d6ec6,moonshotai/Kimi-K2-Instruct-0905,together_ai,sqlite-db-truncate,7261,7044,14305,394.126657,False,0.0,moonshotai/Kimi-K2-Instruct-0905,sqlite-db-truncate,394.126657,False,0.0,False,394.126657 +0335bd61-ed5b-43a8-a41c-782f7dd20693,deepseek-ai/DeepSeek-V3.1,together_ai,git-leak-recovery,2551,1891,4442,177.017306,False,0.0,deepseek-ai/DeepSeek-V3.1,git-leak-recovery,177.017306,False,0.6,False,177.017306 +49807970-2d2e-430d-af9d-6ac04e0cc593,gpt-5-nano,openai,code-from-image,1203,797,2000,69.547031,False,0.0,gpt-5-nano,code-from-image,69.547031,False,0.0,False,69.547031 
+8d8c0b1a-fe79-4119-8d90-d66b3fb99ba3,gemini-2.5-flash,gemini,reshard-c4-data,3159,4122,7281,228.45223,False,0.0,gemini-2.5-flash,reshard-c4-data,228.45223,False,0.0,False,228.45223 +d42b7534-4973-449d-ac23-2c662367124f,OpenAI/gpt-oss-20B,together_ai,cobol-modernization,1541,1824,3365,920.936867,False,0.0,OpenAI/gpt-oss-20B,cobol-modernization,920.936867,False,0.0,False,920.936867 +aa6f7e7e-5074-43b9-89ec-24775f66a5be,claude-opus-4-1-20250805,anthropic,build-initramfs-qemu,0,0,0,1765.657198,False,0.0,claude-opus-4-1-20250805,build-initramfs-qemu,1765.657198,False,0.0,False,1765.657198 +2c0bcaaa-4797-40c9-81ec-13da7993c33b,moonshotai/Kimi-K2-Instruct-0905,together_ai,sqlite-db-truncate,3455,3544,6999,276.167985,False,0.0,moonshotai/Kimi-K2-Instruct-0905,sqlite-db-truncate,276.167985,False,0.0,False,276.167985 +4395387f-8a44-4a67-b87c-42431ef0d2ec,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,crack-7z-hash,3116,1849,4965,104.553058,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,crack-7z-hash,104.553058,False,0.0,False,104.553058 +9ae134e3-a91f-440b-aa91-0d0561414b56,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,dna-insert,16605,2014,18619,360.018043,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,dna-insert,360.018043,False,0.0,False,360.018043 +4eb1ef79-211b-4759-bada-10520d7582f4,gemini-2.5-flash,gemini,count-dataset-tokens,5087,4329,9416,912.516773,False,0.0,gemini-2.5-flash,count-dataset-tokens,912.516773,False,0.0,False,912.516773 +ebfc759b-138b-41f5-922f-7599feafce91,grok-code-fast-1,xai,install-windows-3.11,8748,3285,12033,852.042047,False,0.0,grok-code-fast-1,install-windows-3.11,852.042047,False,0.0,False,852.042047 +070a75ab-bf12-4028-9cee-7a0533583ecc,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,circuit-fibsqrt,7093,7119,14212,1145.888043,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,circuit-fibsqrt,1145.888043,False,0.0,False,1145.888043 
+d87a57cb-03bc-4e85-a348-bebe3b803185,moonshotai/Kimi-K2-Instruct-0905,together_ai,fix-ocaml-gc,40240,16449,56689,1420.513525,False,0.0,moonshotai/Kimi-K2-Instruct-0905,fix-ocaml-gc,1420.513525,False,0.0,False,1420.513525 +6cdf559f-952b-46e7-8a4e-8980da5280da,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,bn-fit-modify,19828,12828,32656,1325.061114,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,bn-fit-modify,1325.061114,False,0.0,False,1325.061114 +25234113-072e-4896-ae82-43e0cb6fb206,zai-org/GLM-4.5-Air-FP8,together_ai,largest-eigenval,8935,8258,17193,900.562171,False,0.0,zai-org/GLM-4.5-Air-FP8,largest-eigenval,900.562171,False,0.0,False,900.562171 +2d198eab-ffa2-4c5e-acdb-dd520cfe1b59,grok-code-fast-1,xai,merge-diff-arc-agi-task,8345,2733,11078,223.598911,True,1.0,grok-code-fast-1,merge-diff-arc-agi-task,223.598911,True,0.8,True,223.598911 +d5a94c8b-374e-4719-96ce-8a6c3677d366,gemini-2.5-pro,gemini,filter-js-from-html,2461,1866,4327,135.518955,False,0.0,gemini-2.5-pro,filter-js-from-html,135.518955,False,0.0,False,135.518955 +b95e474b-cf55-46d9-a8e2-c858dd3424b6,openai/gpt-oss-120b,together_ai,cancel-async-tasks,1448,612,2060,50.402216,False,0.0,openai/gpt-oss-120b,cancel-async-tasks,50.402216,False,0.6,False,50.402216 +6bde58e3-f9f7-43e5-aec1-c40e9777c281,gpt-5-nano,openai,feal-differential-cryptanalysis,2529,1715,4244,98.026569,False,0.0,gpt-5-nano,feal-differential-cryptanalysis,98.026569,False,0.0,False,98.026569 +9d1bc831-2e1a-4400-8e2e-e86ff75330c0,openai/gpt-oss-120b,together_ai,sanitize-git-repo,9455,3966,13421,529.431522,False,0.0,openai/gpt-oss-120b,sanitize-git-repo,529.431522,False,0.0,False,529.431522 +1e6ede1b-47b4-4d13-b977-ed246071e37a,moonshotai/Kimi-K2-Instruct-0905,together_ai,merge-diff-arc-agi-task,22245,13219,35464,889.530768,False,0.0,moonshotai/Kimi-K2-Instruct-0905,merge-diff-arc-agi-task,889.530768,False,0.0,False,889.530768 
+9a169b9a-0014-4d0f-bf94-17e4a4da08cd,gemini-2.5-flash,gemini,filter-js-from-html,2013,7562,9575,406.952729,False,0.0,gemini-2.5-flash,filter-js-from-html,406.952729,False,0.0,False,406.952729 +dde43d64-6bfe-40c1-89fc-37ec7520a2bb,gpt-5,openai,run-pdp11-code,2991,2361,5352,1013.657169,False,0.0,gpt-5,run-pdp11-code,1013.657169,False,0.0,False,1013.657169 +9cae2e44-2d01-4ea0-9678-ab5f90087f6c,claude-sonnet-4-20250514,anthropic,install-windows-3.11,10576,5083,15659,349.848141,False,0.0,claude-sonnet-4-20250514,install-windows-3.11,349.848141,False,0.0,False,349.848141 +7f2a3c75-8849-4a30-85e1-4f2b58c10622,gpt-5,openai,form-filling,8227,10992,19219,579.442688,True,1.0,gpt-5,form-filling,579.442688,True,0.8,True,579.442688 +c4d862d2-0938-4e03-b418-e0a34b632590,openai/gpt-oss-120b,together_ai,install-windows-3.11,4762,772,5534,99.331575,False,0.0,openai/gpt-oss-120b,install-windows-3.11,99.331575,False,0.0,False,99.331575 +0c0eb696-3be6-4d9e-b476-f1ced16e7bbb,gpt-5-mini,openai,password-recovery,8114,5908,14022,900.010141,False,0.0,gpt-5-mini,password-recovery,900.010141,False,0.0,False,900.010141 +a4cbeb86-4009-4b86-90d9-4f15d5fe82d9,gpt-5-mini,openai,log-summary-date-ranges,5739,2454,8193,128.262776,False,0.0,gpt-5-mini,log-summary-date-ranges,128.262776,False,0.0,False,128.262776 +6120b5c2-4af1-439f-8b55-45de899d7236,openai/gpt-oss-120b,together_ai,extract-elf,2349,1651,4000,286.513563,True,1.0,openai/gpt-oss-120b,extract-elf,286.513563,True,0.4,True,286.513563 +bf5b9ab7-080c-4c78-93ec-76e703a888e1,claude-opus-4-1-20250805,anthropic,count-dataset-tokens,6588,2620,9208,480.764525,False,0.0,claude-opus-4-1-20250805,count-dataset-tokens,480.764525,False,0.0,False,480.764525 +6f281982-0af3-430a-90be-ec525345663c,OpenAI/gpt-oss-20B,together_ai,reshard-c4-data,1810,1860,3670,56.930466,False,0.0,OpenAI/gpt-oss-20B,reshard-c4-data,56.930466,False,0.0,False,56.930466 
+6140b0e4-d434-46ba-951c-06e778d13652,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,fix-git,1724,946,2670,140.804019,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,fix-git,140.804019,False,0.0,False,140.804019 +f11d05cb-fa50-4280-809c-79d3486cc1bb,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,adaptive-rejection-sampler,13729,7527,21256,920.723752,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,adaptive-rejection-sampler,920.723752,False,0.0,False,920.723752 +946d672b-2327-4949-a23c-f8ea8e92b420,zai-org/GLM-4.5-Air-FP8,together_ai,make-mips-interpreter,25750,20301,46051,1683.325587,False,0.0,zai-org/GLM-4.5-Air-FP8,make-mips-interpreter,1683.325587,False,0.0,False,1683.325587 +150b4736-4bf4-4e87-826c-154a6b2cdfd2,grok-code-fast-1,xai,hf-model-inference,4015,894,4909,134.600098,True,1.0,grok-code-fast-1,hf-model-inference,134.600098,True,0.4,True,134.600098 +531a69fd-6fd5-4be4-93f4-5b947121cf1e,gemini-2.5-flash,gemini,install-klee-minimal,20431,8561,28992,900.124814,False,0.0,gemini-2.5-flash,install-klee-minimal,900.124814,False,0.0,False,900.124814 +59bdc1c2-acd2-4f71-be3a-1c07605eabf0,gpt-5-mini,openai,write-compressor,2916,1159,4075,111.409613,False,0.0,gpt-5-mini,write-compressor,111.409613,False,0.0,False,111.409613 +a400b2a4-a299-4ace-a818-7b63b51d5b64,moonshotai/Kimi-K2-Instruct-0905,together_ai,hf-model-inference,6912,4311,11223,453.037159,False,0.0,moonshotai/Kimi-K2-Instruct-0905,hf-model-inference,453.037159,False,0.0,False,453.037159 +ea4eb20d-cead-4887-8ab6-af9ebb140d1e,grok-code-fast-1,xai,constraints-scheduling,2861,2999,5860,147.825986,True,1.0,grok-code-fast-1,constraints-scheduling,147.825986,True,0.8,True,147.825986 +b1329b7c-a036-496d-aa49-f73af5b23cce,gpt-5,openai,log-summary-date-ranges,5498,1430,6928,56.137735,False,0.0,gpt-5,log-summary-date-ranges,56.137735,False,0.0,False,56.137735 
+dba4d961-5275-4b10-8f2e-c025a6d4c7bc,grok-4-0709,xai,build-cython-ext,18922,4639,23561,910.697525,False,0.0,grok-4-0709,build-cython-ext,910.697525,False,0.0,False,910.697525 +cb876c41-2dab-45b9-8c43-39d015a984bc,zai-org/GLM-4.5-Air-FP8,together_ai,reverse-engineering,18177,15897,34074,2104.729972,False,0.0,zai-org/GLM-4.5-Air-FP8,reverse-engineering,2104.729972,False,0.0,False,2104.729972 +e22a08e7-22a6-464e-a8f3-7d687b8ec7bc,OpenAI/gpt-oss-20B,together_ai,run-pdp11-code,1047,610,1657,192.493951,False,0.0,OpenAI/gpt-oss-20B,run-pdp11-code,192.493951,False,0.0,False,192.493951 +f2829ebc-d8a0-4a5b-8eb7-46e0bf85a454,gemini-2.5-pro,gemini,adaptive-rejection-sampler,8678,7329,16007,917.26487,True,1.0,gemini-2.5-pro,adaptive-rejection-sampler,917.26487,True,0.4,True,917.26487 +69895dee-1d12-4a7a-860d-48edc587ac27,gpt-5-mini,openai,log-summary-date-ranges,2806,1766,4572,73.332209,False,0.0,gpt-5-mini,log-summary-date-ranges,73.332209,False,0.0,False,73.332209 +a5c7c2f4-f26e-426f-aa1e-117ca5e40f48,claude-sonnet-4-20250514,anthropic,reshard-c4-data,8444,6634,15078,1835.648696,False,0.0,claude-sonnet-4-20250514,reshard-c4-data,1835.648696,False,0.0,False,1835.648696 +fad47282-aed6-492d-8fdb-729409bae839,OpenAI/gpt-oss-20B,together_ai,run-pdp11-code,3736,13765,17501,1002.170458,False,0.0,OpenAI/gpt-oss-20B,run-pdp11-code,1002.170458,False,0.0,False,1002.170458 +2eed3e80-a10d-427b-8494-014fc040b093,zai-org/GLM-4.5-Air-FP8,together_ai,gpt2-codegolf,6013,6670,12683,302.317268,False,0.0,zai-org/GLM-4.5-Air-FP8,gpt2-codegolf,302.317268,False,0.0,False,302.317268 +ddfd4110-01a6-41a0-83d1-26bea4615157,grok-4-0709,xai,fix-code-vulnerability,1580,249,1829,947.287169,False,0.0,grok-4-0709,fix-code-vulnerability,947.287169,False,0.2,False,947.287169 +74a1c787-b60d-44c2-b35a-41783a7b5cda,grok-4-0709,xai,count-dataset-tokens,10975,2290,13265,904.26028,False,0.0,grok-4-0709,count-dataset-tokens,904.26028,False,0.0,False,904.26028 
+e5ef1524-6e3b-4942-86a2-39bbb2b0813c,claude-opus-4-1-20250805,anthropic,db-wal-recovery,7192,5902,13094,249.388615,False,0.0,claude-opus-4-1-20250805,db-wal-recovery,249.388615,False,0.0,False,249.388615 +895598b7-5163-4e78-b72e-9114e94faeac,deepseek-ai/DeepSeek-V3.1,together_ai,train-fasttext,23439,8695,32134,2501.538762,False,0.0,deepseek-ai/DeepSeek-V3.1,train-fasttext,2501.538762,False,0.0,False,2501.538762 +08622f25-0d54-4aea-b380-6b7dab1d94f0,OpenAI/gpt-oss-20B,together_ai,largest-eigenval,283,1106,1389,45.439537,False,0.0,OpenAI/gpt-oss-20B,largest-eigenval,45.439537,False,0.0,False,45.439537 +168c4f60-c6b6-4160-afab-1d4ea1590c75,openai/gpt-oss-120b,together_ai,feal-differential-cryptanalysis,2124,993,3117,289.170768,False,0.0,openai/gpt-oss-120b,feal-differential-cryptanalysis,289.170768,False,0.0,False,289.170768 +5bc41dd8-6f5b-4e9d-abb2-eed152f2acb2,gpt-5,openai,tune-mjcf,9221,5477,14698,963.670652,False,0.0,gpt-5,tune-mjcf,963.670652,False,0.0,False,963.670652 +72a03d34-a27c-4f1c-a23d-606c3ba778d8,grok-code-fast-1,xai,build-cython-ext,19421,7114,26535,480.811365,False,0.0,grok-code-fast-1,build-cython-ext,480.811365,False,0.0,False,480.811365 +3550fb97-b4ff-4154-b1d1-303a3983cf81,deepseek-ai/DeepSeek-V3.1,together_ai,cobol-modernization,19692,17969,37661,915.748719,True,1.0,deepseek-ai/DeepSeek-V3.1,cobol-modernization,915.748719,True,0.6,True,915.748719 +e45353e4-e3b0-4389-a617-843ac953c8c7,OpenAI/gpt-oss-20B,together_ai,gpt2-codegolf,2077,3766,5843,210.674505,False,0.0,OpenAI/gpt-oss-20B,gpt2-codegolf,210.674505,False,0.0,False,210.674505 +6ab0dc44-7332-4d0a-96f6-975bed736d10,OpenAI/gpt-oss-20B,together_ai,torch-tensor-parallelism,2034,1816,3850,72.891641,False,0.0,OpenAI/gpt-oss-20B,torch-tensor-parallelism,72.891641,False,0.0,False,72.891641 +a57502a1-ff23-4bcb-bc69-6f7fc14f6158,zai-org/GLM-4.5-Air-FP8,together_ai,dna-assembly,16608,5878,22486,738.761843,False,0.0,zai-org/GLM-4.5-Air-FP8,dna-assembly,738.761843,False,0.0,False,738.761843 
+fabc7c4d-ebe9-41ca-a53a-679445d95a55,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,fix-code-vulnerability,10147,5351,15498,900.248602,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,fix-code-vulnerability,900.248602,False,0.4,False,900.248602 +d55842c3-4000-4d30-9d39-1ed8c8ae39b2,claude-sonnet-4-20250514,anthropic,train-fasttext,28801,14169,42970,3647.624007,False,0.0,claude-sonnet-4-20250514,train-fasttext,3647.624007,False,0.0,False,3647.624007 +f758b943-1fb6-47f0-8f1d-5a206c158839,openai/gpt-oss-120b,together_ai,chess-best-move,7257,10418,17675,902.75813,False,0.0,openai/gpt-oss-120b,chess-best-move,902.75813,False,0.0,False,902.75813 +f342cf95-6730-4acf-9f29-c4f95bbfe419,gemini-2.5-flash,gemini,pypi-server,22201,9789,31990,902.599329,False,0.0,gemini-2.5-flash,pypi-server,902.599329,False,0.0,False,902.599329 +dcaa9baa-73d6-40fe-b124-3382093504da,deepseek-ai/DeepSeek-V3.1,together_ai,qemu-alpine-ssh,3527,4525,8052,1045.194376,False,0.0,deepseek-ai/DeepSeek-V3.1,qemu-alpine-ssh,1045.194376,False,0.2,False,1045.194376 +e5c32866-2596-4e0a-8412-b2baf48c4f6e,deepseek-ai/DeepSeek-V3.1,together_ai,financial-document-processor,9190,4592,13782,307.804841,False,0.0,deepseek-ai/DeepSeek-V3.1,financial-document-processor,307.804841,False,0.0,False,307.804841 +5292ba24-b51f-4f30-8994-7e01ce27d17d,grok-4-0709,xai,reverse-engineering,7750,4223,11973,777.174587,True,1.0,grok-4-0709,reverse-engineering,777.174587,True,0.2,True,777.174587 +4e8f60c0-b75a-4f48-9b67-1db360c1a653,claude-opus-4-1-20250805,anthropic,configure-git-webserver,6424,1854,8278,549.973132,True,1.0,claude-opus-4-1-20250805,configure-git-webserver,549.973132,True,0.625,True,549.973132 +b841f96f-063c-44c6-a480-10e4f6fadbfb,gpt-5-mini,openai,financial-document-processor,3886,4354,8240,187.002199,False,0.0,gpt-5-mini,financial-document-processor,187.002199,False,0.0,False,187.002199 
+41f19d9b-0fc9-4c01-be8d-a4d61e45585b,zai-org/GLM-4.5-Air-FP8,together_ai,count-dataset-tokens,11166,4563,15729,588.420629,False,0.0,zai-org/GLM-4.5-Air-FP8,count-dataset-tokens,588.420629,False,0.0,False,588.420629 +eb1600dc-eb83-4359-b7c3-4838da522f94,gpt-5-mini,openai,break-filter-js-from-html,2541,1317,3858,175.414401,False,0.0,gpt-5-mini,break-filter-js-from-html,175.414401,False,0.0,False,175.414401 +63680ddc-5269-4de2-a3b7-edd9d8395acd,zai-org/GLM-4.5-Air-FP8,together_ai,sparql-university,6200,3479,9679,152.513995,False,0.0,zai-org/GLM-4.5-Air-FP8,sparql-university,152.513995,False,0.0,False,152.513995 +2bd7a599-7fc6-40b9-8a6e-7248ce4fe12b,gpt-5-nano,openai,chess-best-move,7417,6746,14163,901.981711,False,0.0,gpt-5-nano,chess-best-move,901.981711,False,0.0,False,901.981711 +3ccd2fb7-1823-4cd0-ae9e-4154268de659,grok-code-fast-1,xai,fix-ocaml-gc,15911,3971,19882,798.084791,False,0.0,grok-code-fast-1,fix-ocaml-gc,798.084791,False,0.0,False,798.084791 +7d4e9777-04ea-4eab-8112-37b33c3434ac,moonshotai/Kimi-K2-Instruct-0905,together_ai,feal-linear-cryptanalysis,20057,18078,38135,1810.122203,False,0.0,moonshotai/Kimi-K2-Instruct-0905,feal-linear-cryptanalysis,1810.122203,False,0.0,False,1810.122203 +771c770a-515c-4d1a-aa52-fc23621d9917,gpt-5,openai,fix-git,3652,1907,5559,152.242485,True,1.0,gpt-5,fix-git,152.242485,True,1.0,True,152.242485 +48fc6838-ce69-4495-bff7-21cf134d6c6a,gemini-2.5-pro,gemini,cobol-modernization,5612,3610,9222,420.1549,True,1.0,gemini-2.5-pro,cobol-modernization,420.1549,True,1.0,True,420.1549 +49b5b975-45b9-4de9-b40b-918804413fd0,grok-4-0709,xai,chess-best-move,4160,2994,7154,902.5297,False,0.0,grok-4-0709,chess-best-move,902.5297,False,0.0,False,902.5297 +f1657e05-45a0-4369-a05d-10b4c50dcdb3,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,fix-ocaml-gc,24777,8586,33363,801.922854,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,fix-ocaml-gc,801.922854,False,0.0,False,801.922854 
+fd017dcc-4847-4433-8af4-9d825bb8dfb5,claude-sonnet-4-20250514,anthropic,install-klee-minimal,11349,2114,13463,900.292791,False,0.0,claude-sonnet-4-20250514,install-klee-minimal,900.292791,False,0.0,False,900.292791 +b94ba249-e720-483c-b322-88a76474fb89,gemini-2.5-pro,gemini,constraints-scheduling,4431,3187,7618,299.170936,True,1.0,gemini-2.5-pro,constraints-scheduling,299.170936,True,1.0,True,299.170936 +6ceb5cbf-90a1-49ca-bee5-b7467d963fd9,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,train-fasttext,10599,3989,14588,507.799676,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,train-fasttext,507.799676,False,0.0,False,507.799676 +fee3a8fd-bfb6-4f94-bf0a-22c7d4f76eb6,gpt-5,openai,break-filter-js-from-html,2920,1411,4331,563.454374,False,0.0,gpt-5,break-filter-js-from-html,563.454374,False,0.4285714285714285,False,563.454374 +ed818932-8618-4b31-8753-c3eaadd6f6c8,gpt-5-nano,openai,write-compressor,21944,11116,33060,900.240016,False,0.0,gpt-5-nano,write-compressor,900.240016,False,0.0,False,900.240016 +997ab650-31c3-47a2-9643-fe7eae37a508,OpenAI/gpt-oss-20B,together_ai,train-fasttext,1854,855,2709,252.774943,False,0.0,OpenAI/gpt-oss-20B,train-fasttext,252.774943,False,0.0,False,252.774943 +fa39bd03-bb5d-445a-aa3d-1313fd1e4ab4,deepseek-ai/DeepSeek-V3.1,together_ai,regex-log,1957,1582,3539,136.612886,False,0.0,deepseek-ai/DeepSeek-V3.1,regex-log,136.612886,False,0.2,False,136.612886 +f0358f4e-e4b3-4de8-bd5b-4404898f0a95,OpenAI/gpt-oss-20B,together_ai,winning-avg-corewars,358,684,1042,57.29964,False,0.0,OpenAI/gpt-oss-20B,winning-avg-corewars,57.29964,False,0.0,False,57.29964 +7ea72d4f-78c9-4030-a7fb-47eadf1a88f5,grok-4-0709,xai,hf-model-inference,4100,1055,5155,422.673379,True,1.0,grok-4-0709,hf-model-inference,422.673379,True,1.0,True,422.673379 +830c98de-9701-40c2-8c5a-0b6b04617d5b,openai/gpt-oss-120b,together_ai,mteb-retrieve,1811,1143,2954,107.016436,False,0.0,openai/gpt-oss-120b,mteb-retrieve,107.016436,False,0.0,False,107.016436 
+14206059-cb45-4e40-a1b7-b55478198a4a,gpt-5-mini,openai,path-tracing-reverse,36486,27819,64305,1803.244462,False,0.0,gpt-5-mini,path-tracing-reverse,1803.244462,False,0.0,False,1803.244462 +c7280f12-74ed-48cd-a12b-83b016181e59,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,distribution-search,15993,16668,32661,1526.148199,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,distribution-search,1526.148199,False,0.4,False,1526.148199 +21bd5aa3-4449-4842-860c-992f1226eebc,gemini-2.5-flash,gemini,polyglot-rust-c,1409,1757,3166,905.820841,False,0.0,gemini-2.5-flash,polyglot-rust-c,905.820841,False,0.0,False,905.820841 +c85b9247-8a5c-44dc-be6e-1e560f079900,openai/gpt-oss-120b,together_ai,fix-git,5373,1930,7303,136.63619,True,1.0,openai/gpt-oss-120b,fix-git,136.63619,True,0.6,True,136.63619 +eb80e1a1-98a1-4476-9428-199df528a4ee,deepseek-ai/DeepSeek-V3.1,together_ai,break-filter-js-from-html,9058,13305,22363,1252.880764,False,0.0,deepseek-ai/DeepSeek-V3.1,break-filter-js-from-html,1252.880764,False,0.0,False,1252.880764 +2bdb9791-14df-4b86-8d4b-31cc305586b4,deepseek-ai/DeepSeek-V3.1,together_ai,nginx-request-logging,6966,3588,10554,516.587813,True,1.0,deepseek-ai/DeepSeek-V3.1,nginx-request-logging,516.587813,True,0.4,True,516.587813 +58af97cc-c69e-4149-ac6b-7bc71db7a0e1,grok-4-0709,xai,pytorch-model-cli,12696,7102,19798,900.494879,False,0.0,grok-4-0709,pytorch-model-cli,900.494879,False,0.6,False,900.494879 +220c858b-cb47-45b1-82b2-8ce0ea90e450,gemini-2.5-pro,gemini,pytorch-model-cli,17895,5756,23651,900.00787,True,1.0,gemini-2.5-pro,pytorch-model-cli,900.00787,True,0.4,True,900.00787 +25b4e369-a625-4567-8011-07a293e34937,claude-sonnet-4-20250514,anthropic,form-filling,9238,7236,16474,423.387936,True,1.0,claude-sonnet-4-20250514,form-filling,423.387936,True,1.0,True,423.387936 
+39f86d6b-ac6e-485f-ab7c-d5a2198be334,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,regex-log,2518,2318,4836,169.47116,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,regex-log,169.47116,False,0.2,False,169.47116 +c6777baf-6c7c-46b2-adf0-0fbd828de527,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,openssl-selfsigned-cert,3972,2908,6880,415.117961,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,openssl-selfsigned-cert,415.117961,False,0.4,False,415.117961 +7ad021cf-1982-4b5d-b60f-b91981a835b0,gpt-5-nano,openai,gpt2-codegolf,9340,8573,17913,949.044162,False,0.0,gpt-5-nano,gpt2-codegolf,949.044162,False,0.0,False,949.044162 +afa51c2f-fa37-46ce-9d2f-6f132d35cf87,gemini-2.5-pro,gemini,circuit-fibsqrt,9315,7532,16847,747.144993,False,0.0,gemini-2.5-pro,circuit-fibsqrt,747.144993,False,0.0,False,747.144993 +c4d1cce3-76f9-4e3e-b409-156261d2c435,openai/gpt-oss-120b,together_ai,sanitize-git-repo,3398,1848,5246,226.641051,False,0.0,openai/gpt-oss-120b,sanitize-git-repo,226.641051,False,0.0,False,226.641051 +8fbbaa08-b3b9-4621-a646-91e8e6ff4818,claude-sonnet-4-20250514,anthropic,db-wal-recovery,6889,7828,14717,941.266466,False,0.0,claude-sonnet-4-20250514,db-wal-recovery,941.266466,False,0.0,False,941.266466 +0a6c2940-b35f-40b9-813d-e2adc824a2de,openai/gpt-oss-120b,together_ai,torch-tensor-parallelism,2177,2775,4952,53.688934,False,0.0,openai/gpt-oss-120b,torch-tensor-parallelism,53.688934,False,0.0,False,53.688934 +e759cfc1-86cb-4398-b354-11a6460c0214,gpt-5,openai,distribution-search,2958,2127,5085,148.92117,True,1.0,gpt-5,distribution-search,148.92117,True,1.0,True,148.92117 +fd92f0a3-1a06-4d73-9dac-df1cbc970f50,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,hf-model-inference,7642,3404,11046,582.349791,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,hf-model-inference,582.349791,False,0.0,False,582.349791 
+5bf64581-bc7d-4cf2-bf1e-7bf347d7791e,claude-sonnet-4-20250514,anthropic,port-compressor,39742,21534,61276,3609.163831,False,0.0,claude-sonnet-4-20250514,port-compressor,3609.163831,False,0.2,False,3609.163831 +fac03630-83fa-4994-9021-15a0789c8dbd,OpenAI/gpt-oss-20B,together_ai,cobol-modernization,3942,13263,17205,914.934667,False,0.0,OpenAI/gpt-oss-20B,cobol-modernization,914.934667,False,0.0,False,914.934667 +7fb74be7-02ce-495e-937a-880c7970e775,OpenAI/gpt-oss-20B,together_ai,schemelike-metacircular-eval,294,495,789,83.828158,False,0.0,OpenAI/gpt-oss-20B,schemelike-metacircular-eval,83.828158,False,0.0,False,83.828158 +17d25f0b-4f3a-4708-8f4d-65e7b6572e9d,gemini-2.5-pro,gemini,build-pov-ray,16005,6427,22432,1015.919214,True,1.0,gemini-2.5-pro,build-pov-ray,1015.919214,True,1.0,True,1015.919214 +dc9c0b1f-74a0-49e0-83b2-94fcfcc437b1,grok-code-fast-1,xai,log-summary-date-ranges,9221,6740,15961,192.412587,False,0.0,grok-code-fast-1,log-summary-date-ranges,192.412587,False,0.0,False,192.412587 +356654b7-3186-41b4-be12-aad910568747,OpenAI/gpt-oss-20B,together_ai,schemelike-metacircular-eval,607,1244,1851,110.064861,False,0.0,OpenAI/gpt-oss-20B,schemelike-metacircular-eval,110.064861,False,0.0,False,110.064861 +1f705936-1ea7-4b1d-9c72-a1d7e9412b14,zai-org/GLM-4.5-Air-FP8,together_ai,path-tracing,51200,8513,59713,575.254942,False,0.0,zai-org/GLM-4.5-Air-FP8,path-tracing,575.254942,False,0.0,False,575.254942 +18ace2db-d5cf-4c41-b48e-075548cb28ab,gemini-2.5-flash,gemini,torch-tensor-parallelism,1936,2791,4727,67.658286,False,0.0,gemini-2.5-flash,torch-tensor-parallelism,67.658286,False,0.0,False,67.658286 +edd375ed-ded0-4f7a-abdc-4974e03c75f5,gemini-2.5-pro,gemini,form-filling,4119,4393,8512,248.176906,False,0.0,gemini-2.5-pro,form-filling,248.176906,False,0.2,False,248.176906 +eede16e8-4c38-492c-80f5-4aeb09f8ebae,gemini-2.5-pro,gemini,git-leak-recovery,1995,1271,3266,143.796337,True,1.0,gemini-2.5-pro,git-leak-recovery,143.796337,True,1.0,True,143.796337 
+d2e9a14d-4ba2-46a7-bff2-cc494246c169,gemini-2.5-flash,gemini,constraints-scheduling,22065,18029,40094,1211.78287,True,1.0,gemini-2.5-flash,constraints-scheduling,1211.78287,True,0.4,True,1211.78287 +0a7f9ad3-831b-4a14-8f78-33ea4e35e2b1,gemini-2.5-flash,gemini,filter-js-from-html,3336,2614,5950,210.840016,False,0.0,gemini-2.5-flash,filter-js-from-html,210.840016,False,0.0,False,210.840016 +9f55c0ed-f20b-4bae-91ab-a2ba8b618778,OpenAI/gpt-oss-20B,together_ai,regex-log,1210,721,1931,66.696215,False,0.0,OpenAI/gpt-oss-20B,regex-log,66.696215,False,0.0,False,66.696215 +01dc8b2d-4901-4e46-b50d-ae6b98b67060,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,crack-7z-hash,8627,2327,10954,390.560703,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,crack-7z-hash,390.560703,False,0.0,False,390.560703 +aa6079f2-f1b2-48a5-8024-89d587a1d1d8,openai/gpt-oss-120b,together_ai,largest-eigenval,9838,10222,20060,900.004603,False,0.0,openai/gpt-oss-120b,largest-eigenval,900.004603,False,0.0,False,900.004603 +488e2534-e402-4199-a97d-8430240bca4d,claude-opus-4-1-20250805,anthropic,model-extraction-relu-logits,3147,2105,5252,156.784934,False,0.0,claude-opus-4-1-20250805,model-extraction-relu-logits,156.784934,False,0.0,False,156.784934 +e5439a3f-7ba5-4a25-8513-891bb22a313c,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,path-tracing-reverse,7402,6917,14319,949.059229,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,path-tracing-reverse,949.059229,False,0.0,False,949.059229 +8ca02970-58fa-48fd-893c-1b13f2a64207,zai-org/GLM-4.5-Air-FP8,together_ai,pypi-server,16111,9013,25124,789.345523,False,0.0,zai-org/GLM-4.5-Air-FP8,pypi-server,789.345523,False,0.2,False,789.345523 +856f3eec-9478-46d7-be29-a42a2b5e8f6d,grok-code-fast-1,xai,write-compressor,3578,2354,5932,206.184307,False,0.0,grok-code-fast-1,write-compressor,206.184307,False,0.0,False,206.184307 
+07cf8898-1be8-405e-a40a-2297b5ac347c,deepseek-ai/DeepSeek-V3.1,together_ai,torch-tensor-parallelism,2448,1505,3953,97.884612,False,0.0,deepseek-ai/DeepSeek-V3.1,torch-tensor-parallelism,97.884612,False,0.0,False,97.884612 +a5bb7d2d-09d8-47ad-a00c-aca600518a72,grok-code-fast-1,xai,sparql-university,4866,1735,6601,90.451081,False,0.0,grok-code-fast-1,sparql-university,90.451081,False,0.2,False,90.451081 +66844dda-35e6-4e87-9251-260e0f8f9339,gpt-5-mini,openai,build-pov-ray,11487,4121,15608,960.79387,False,0.0,gpt-5-mini,build-pov-ray,960.79387,False,0.0,False,960.79387 +5e8c653c-38b7-4ccd-981e-0b5df6419bbd,claude-opus-4-1-20250805,anthropic,reshard-c4-data,9924,9549,19473,900.005734,False,0.0,claude-opus-4-1-20250805,reshard-c4-data,900.005734,False,0.0,False,900.005734 +2ac3e485-450e-4946-9fef-22661df31e00,moonshotai/Kimi-K2-Instruct-0905,together_ai,install-klee-minimal,18777,2934,21711,905.783931,False,0.0,moonshotai/Kimi-K2-Instruct-0905,install-klee-minimal,905.783931,False,0.0,False,905.783931 +1b61a5c5-37e0-4ade-b668-98b94419791d,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,financial-document-processor,3752,2995,6747,255.456439,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,financial-document-processor,255.456439,False,0.0,False,255.456439 +89d03271-11f3-40b7-8652-7811c87c74f8,gpt-5,openai,crack-7z-hash,10070,4716,14786,868.820394,True,1.0,gpt-5,crack-7z-hash,868.820394,True,0.4285714285714285,True,868.820394 +70f05a09-70ae-4d8d-969e-aeee76119580,gpt-5-mini,openai,mteb-retrieve,5092,3720,8812,628.823794,False,0.0,gpt-5-mini,mteb-retrieve,628.823794,False,0.0,False,628.823794 +caec024e-5e88-4670-a6b6-5ba5cfcfa517,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,reshard-c4-data,8086,6183,14269,901.364213,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,reshard-c4-data,901.364213,False,0.0,False,901.364213 
+2aa8a679-658b-481a-b262-42fdea09d8ed,moonshotai/Kimi-K2-Instruct-0905,together_ai,model-extraction-relu-logits,4613,4665,9278,486.902523,False,0.0,moonshotai/Kimi-K2-Instruct-0905,model-extraction-relu-logits,486.902523,False,0.4,False,486.902523 +a8a4cbe5-c513-4402-8427-f59e35c9f280,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,run-pdp11-code,11337,5323,16660,557.633957,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,run-pdp11-code,557.633957,False,0.0,False,557.633957 +84c9fd73-fc0e-4aad-ace9-3c4a7c491674,gemini-2.5-flash,gemini,openssl-selfsigned-cert,2505,2352,4857,161.431979,False,0.0,gemini-2.5-flash,openssl-selfsigned-cert,161.431979,False,0.0,False,161.431979 +01d61d98-bce0-42cd-b01f-43b334645d7d,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-pov-ray,32257,18222,50479,3782.790563,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-pov-ray,3782.790563,False,0.0,False,3782.790563 +c68de3c6-c698-4e36-8317-9be7d35d104b,gpt-5,openai,path-tracing-reverse,11799,23742,35541,1800.000693,False,0.0,gpt-5,path-tracing-reverse,1800.000693,False,0.0,False,1800.000693 +eb17ff62-d0fd-49e6-820a-4a012b4ef4f2,gpt-5,openai,dna-insert,5003,5541,10544,360.001225,False,0.0,gpt-5,dna-insert,360.001225,False,0.0,False,360.001225 +053bb4d5-419c-493c-8d7b-974a4ff377e2,gpt-5-nano,openai,count-dataset-tokens,9154,6285,15439,900.696784,False,0.0,gpt-5-nano,count-dataset-tokens,900.696784,False,0.0,False,900.696784 +b5c0108f-7418-4fc4-a254-6e23d6f39a15,OpenAI/gpt-oss-20B,together_ai,path-tracing-reverse,597,2819,3416,313.094215,False,0.0,OpenAI/gpt-oss-20B,path-tracing-reverse,313.094215,False,0.0,False,313.094215 +607d1c62-afed-4ec5-83a5-958125d43a67,moonshotai/Kimi-K2-Instruct-0905,together_ai,mteb-leaderboard,21765,6458,28223,545.52535,False,0.0,moonshotai/Kimi-K2-Instruct-0905,mteb-leaderboard,545.52535,False,0.0,False,545.52535 
+80e5171d-2f59-4b46-911f-51567c16e20a,deepseek-ai/DeepSeek-V3.1,together_ai,large-scale-text-editing,4688,5075,9763,646.635553,False,0.0,deepseek-ai/DeepSeek-V3.1,large-scale-text-editing,646.635553,False,0.0,False,646.635553 +5d1e7eb3-5bdd-4a30-b678-91776bc0907b,claude-opus-4-1-20250805,anthropic,merge-diff-arc-agi-task,16085,6142,22227,265.488601,False,0.0,claude-opus-4-1-20250805,merge-diff-arc-agi-task,265.488601,False,0.3333333333333333,False,265.488601 +8f1b0971-ef33-4ec6-9412-552af16195cd,grok-code-fast-1,xai,build-pmars,11050,2826,13876,783.378833,True,1.0,grok-code-fast-1,build-pmars,783.378833,True,0.8,True,783.378833 +14c1c7df-3daf-428f-a914-42f56c86f865,OpenAI/gpt-oss-20B,together_ai,mteb-retrieve,1461,1190,2651,149.596764,False,0.0,OpenAI/gpt-oss-20B,mteb-retrieve,149.596764,False,0.0,False,149.596764 +6819fe3a-fbc7-45f0-8b81-63d3d6d092b6,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,qemu-startup,1523,863,2386,137.037577,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,qemu-startup,137.037577,True,0.4,True,137.037577 +e1ad5434-ef3e-4d1b-a619-2a1b1b7a347f,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,run-pdp11-code,3950,4211,8161,1037.034821,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,run-pdp11-code,1037.034821,False,0.0,False,1037.034821 +693b5606-46c3-4bfa-affc-812af6d44357,claude-opus-4-1-20250805,anthropic,wasm-pipeline,9784,5103,14887,900.002479,False,0.0,claude-opus-4-1-20250805,wasm-pipeline,900.002479,False,0.1428571428571428,False,900.002479 +15d28e88-e51c-4aa6-b41f-bc09a440a57f,grok-code-fast-1,xai,break-filter-js-from-html,4903,5002,9905,796.159249,False,0.0,grok-code-fast-1,break-filter-js-from-html,796.159249,False,0.0,False,796.159249 +f931da19-2f56-4f8e-8f56-dc173a1ddd4a,gpt-5,openai,make-doom-for-mips,8575,8978,17553,900.000973,False,0.0,gpt-5,make-doom-for-mips,900.000973,False,0.0,False,900.000973 
+55c63350-ca20-495f-8913-fd1456b1b903,claude-opus-4-1-20250805,anthropic,path-tracing-reverse,25807,19392,45199,1839.759531,False,0.0,claude-opus-4-1-20250805,path-tracing-reverse,1839.759531,False,0.0,False,1839.759531 +81e72b55-e7d9-4231-975e-f88995ed20bb,gpt-5-nano,openai,merge-diff-arc-agi-task,10555,8238,18793,517.514929,False,0.0,gpt-5-nano,merge-diff-arc-agi-task,517.514929,False,0.2,False,517.514929 +965c1989-f3ea-442d-84dc-ef826bf10709,gpt-5,openai,polyglot-rust-c,858,919,1777,900.113803,False,0.0,gpt-5,polyglot-rust-c,900.113803,False,0.0,False,900.113803 +2c8bf95a-102c-4572-8010-c3898129d7c6,claude-sonnet-4-20250514,anthropic,sparql-university,9747,6504,16251,884.868928,False,0.0,claude-sonnet-4-20250514,sparql-university,884.868928,False,0.0,False,884.868928 +ff50a638-2941-4063-a70e-5fc0e5508c2b,gemini-2.5-flash,gemini,bn-fit-modify,26404,23894,50298,3600.651741,False,0.0,gemini-2.5-flash,bn-fit-modify,3600.651741,False,0.0,False,3600.651741 +6840746f-28b9-47b8-b048-240080d9a164,grok-4-0709,xai,build-pov-ray,17398,4786,22184,1030.578869,True,1.0,grok-4-0709,build-pov-ray,1030.578869,True,1.0,True,1030.578869 +549c552d-4def-4ae6-a614-5f7d5988febb,gemini-2.5-pro,gemini,count-dataset-tokens,15836,3411,19247,902.980624,False,0.0,gemini-2.5-pro,count-dataset-tokens,902.980624,False,0.0,False,902.980624 +9a13732f-f64a-4144-98b2-86de1cf7d49d,zai-org/GLM-4.5-Air-FP8,together_ai,log-summary-date-ranges,2651,2436,5087,99.454935,True,1.0,zai-org/GLM-4.5-Air-FP8,log-summary-date-ranges,99.454935,True,0.8,True,99.454935 +39e7cc9c-87a2-456e-877e-823d6b7a57c5,claude-opus-4-1-20250805,anthropic,polyglot-c-py,2208,1619,3827,138.02483,False,0.0,claude-opus-4-1-20250805,polyglot-c-py,138.02483,False,0.0,False,138.02483 +6f35d2a2-4ad5-4fe6-b0e2-22f99e24418f,grok-4-0709,xai,write-compressor,1456,592,2048,903.095772,False,0.0,grok-4-0709,write-compressor,903.095772,False,0.0,False,903.095772 
+609a4dbc-cc97-47a3-984d-f1ab42be02e1,openai/gpt-oss-120b,together_ai,large-scale-text-editing,6550,11466,18016,1228.576369,False,0.0,openai/gpt-oss-120b,large-scale-text-editing,1228.576369,False,0.0,False,1228.576369 +4ea25959-ffb9-4bd7-881e-b9fdf873a331,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,regex-log,2049,2841,4890,253.577828,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,regex-log,253.577828,False,0.2,False,253.577828 +c9e92c24-2d05-4b52-9314-5ab7406e0b9d,claude-opus-4-1-20250805,anthropic,gpt2-codegolf,24553,18554,43107,907.131468,False,0.0,claude-opus-4-1-20250805,gpt2-codegolf,907.131468,False,0.0,False,907.131468 +2443e660-db36-4114-9128-f562d8b33d02,claude-opus-4-1-20250805,anthropic,mteb-leaderboard,13880,5924,19804,405.67755,False,0.0,claude-opus-4-1-20250805,mteb-leaderboard,405.67755,False,0.0,False,405.67755 +e7590a6a-2c16-4cf1-8cdb-6579359fd3c0,claude-sonnet-4-20250514,anthropic,git-leak-recovery,3389,2968,6357,242.261075,True,1.0,claude-sonnet-4-20250514,git-leak-recovery,242.261075,True,1.0,True,242.261075 +718c8f43-e58f-40f1-b70b-c3e87a262142,deepseek-ai/DeepSeek-V3.1,together_ai,regex-log,2881,2192,5073,123.500391,True,1.0,deepseek-ai/DeepSeek-V3.1,regex-log,123.500391,True,0.2,True,123.500391 +a1b7e64c-a453-4ced-bbc3-b487f50beb48,OpenAI/gpt-oss-20B,together_ai,path-tracing-reverse,3430,10449,13879,933.841408,False,0.0,OpenAI/gpt-oss-20B,path-tracing-reverse,933.841408,False,0.0,False,933.841408 +404d5ee1-69e0-4edb-aa19-be0318d96bc8,claude-opus-4-1-20250805,anthropic,build-pmars,12739,3225,15964,240.389111,True,1.0,claude-opus-4-1-20250805,build-pmars,240.389111,True,0.5,True,240.389111 +498db6da-5bf1-43c2-9e3c-dad13471a78b,grok-code-fast-1,xai,qemu-alpine-ssh,1216,1052,2268,126.480546,False,0.0,grok-code-fast-1,qemu-alpine-ssh,126.480546,False,0.0,False,126.480546 +1de69a71-f848-469d-8298-eb18cde45f23,grok-4-0709,xai,qemu-alpine-ssh,974,544,1518,960.69337,False,0.0,grok-4-0709,qemu-alpine-ssh,960.69337,False,0.0,False,960.69337 
+c6deceed-6bc5-4ad7-b6dc-8e3fc4237632,claude-opus-4-1-20250805,anthropic,mteb-leaderboard,10243,8327,18570,894.546868,False,0.0,claude-opus-4-1-20250805,mteb-leaderboard,894.546868,False,0.0,False,894.546868 +c4f52e70-fda2-4b9a-ac50-f213cb82c082,zai-org/GLM-4.5-Air-FP8,together_ai,mteb-retrieve,2535,2601,5136,102.981173,False,0.0,zai-org/GLM-4.5-Air-FP8,mteb-retrieve,102.981173,False,0.0,False,102.981173 +25824a37-eb61-493c-b671-4bb34c65278f,gpt-5,openai,circuit-fibsqrt,19252,60810,80062,3631.903935,False,0.0,gpt-5,circuit-fibsqrt,3631.903935,False,0.6666666666666666,False,3631.903935 +3366ff69-5908-47e2-be01-e1c302821e48,claude-opus-4-1-20250805,anthropic,winning-avg-corewars,5389,2273,7662,242.722011,True,1.0,claude-opus-4-1-20250805,winning-avg-corewars,242.722011,True,0.3333333333333333,True,242.722011 +5edce7e8-72f1-4666-838d-e83094cf8e6a,gemini-2.5-pro,gemini,write-compressor,10962,10103,21065,920.16247,False,0.0,gemini-2.5-pro,write-compressor,920.16247,False,0.0,False,920.16247 +1e021ab3-4b9f-4499-bba0-935090590c39,gemini-2.5-flash,gemini,constraints-scheduling,3819,4179,7998,446.132755,False,0.0,gemini-2.5-flash,constraints-scheduling,446.132755,False,0.4,False,446.132755 +09364e83-3dd8-4e19-97db-8ddc3dd21e60,openai/gpt-oss-120b,together_ai,tune-mjcf,9076,5522,14598,707.803744,True,1.0,openai/gpt-oss-120b,tune-mjcf,707.803744,True,0.2,True,707.803744 +bd872ef7-223c-41c5-b1db-1ffc0197c52b,claude-opus-4-1-20250805,anthropic,constraints-scheduling,5599,3912,9511,533.379048,False,0.0,claude-opus-4-1-20250805,constraints-scheduling,533.379048,False,0.8888888888888888,False,533.379048 +e7b5c0c1-5e6a-4637-a7a6-ca4c7cbfbf5b,gpt-5-mini,openai,schemelike-metacircular-eval,23734,34064,57798,2413.828432,False,0.0,gpt-5-mini,schemelike-metacircular-eval,2413.828432,False,0.0,False,2413.828432 
+e5adf4b0-6cf2-4dde-ab9e-9b4f751a65be,gemini-2.5-pro,gemini,mteb-leaderboard,29457,13507,42964,1546.836951,False,0.0,gemini-2.5-pro,mteb-leaderboard,1546.836951,False,0.0,False,1546.836951 +7c56abc1-3133-4715-80bf-bc250963e9cd,grok-code-fast-1,xai,fix-ocaml-gc,25638,8594,34232,1973.564711,False,0.0,grok-code-fast-1,fix-ocaml-gc,1973.564711,False,0.0,False,1973.564711 +3c41ab80-d074-481a-b65a-626587d4a050,gpt-5-mini,openai,qemu-alpine-ssh,1998,1707,3705,304.586518,False,0.0,gpt-5-mini,qemu-alpine-ssh,304.586518,False,0.0,False,304.586518 +09b42e7f-972f-4e3c-b529-d8ec69fbf33a,claude-opus-4-1-20250805,anthropic,feal-differential-cryptanalysis,22480,20743,43223,1801.241135,False,0.0,claude-opus-4-1-20250805,feal-differential-cryptanalysis,1801.241135,False,0.0,False,1801.241135 +5efce481-8c38-4bb4-be18-543903df2a89,gemini-2.5-pro,gemini,sparql-university,3019,1709,4728,113.766223,False,0.0,gemini-2.5-pro,sparql-university,113.766223,False,0.6,False,113.766223 +e034aa30-7135-4787-94ed-a2b9a686e080,openai/gpt-oss-120b,together_ai,fix-code-vulnerability,13705,8949,22654,904.445221,False,0.0,openai/gpt-oss-120b,fix-code-vulnerability,904.445221,False,0.0,False,904.445221 +eb815c04-79f6-4e3c-97fd-73f163437195,gpt-5,openai,bn-fit-modify,13585,14448,28033,663.819466,False,0.0,gpt-5,bn-fit-modify,663.819466,False,0.5,False,663.819466 +dda1c072-c77e-4d2a-acfa-24412c369a3f,moonshotai/Kimi-K2-Instruct-0905,together_ai,mteb-leaderboard,15444,3833,19277,506.521827,False,0.0,moonshotai/Kimi-K2-Instruct-0905,mteb-leaderboard,506.521827,False,0.0,False,506.521827 +dfa56d12-ef6f-4e49-b7bc-c49bb609d8ee,claude-opus-4-1-20250805,anthropic,schemelike-metacircular-eval,12695,9526,22221,2402.266617,False,0.0,claude-opus-4-1-20250805,schemelike-metacircular-eval,2402.266617,False,0.0,False,2402.266617 +36561de2-0b6f-4cf4-b168-8d295dc546c0,grok-4-0709,xai,pypi-server,2047,665,2712,249.580629,False,0.0,grok-4-0709,pypi-server,249.580629,False,0.4,False,249.580629 
+a54a7151-0004-4aa8-b5cc-9f0706a355cd,gpt-5-nano,openai,mteb-retrieve,4770,3090,7860,309.128176,False,0.0,gpt-5-nano,mteb-retrieve,309.128176,False,0.0,False,309.128176 +7700b12c-dfe8-4f41-93b9-64581dd40a6f,zai-org/GLM-4.5-Air-FP8,together_ai,adaptive-rejection-sampler,12658,12306,24964,900.549711,False,0.0,zai-org/GLM-4.5-Air-FP8,adaptive-rejection-sampler,900.549711,False,0.0,False,900.549711 +b5b86ea0-4e39-4879-a44f-cad92cb4158f,claude-opus-4-1-20250805,anthropic,vulnerable-secret,2484,2143,4627,78.871735,True,1.0,claude-opus-4-1-20250805,vulnerable-secret,78.871735,True,0.625,True,78.871735 +1e19fede-14d5-46ad-9041-adf5936b595e,gpt-5-mini,openai,install-windows-3.11,9880,7449,17329,618.915039,False,0.0,gpt-5-mini,install-windows-3.11,618.915039,False,0.0,False,618.915039 +13f6237b-93f8-40d3-a761-a1a272cc7eb2,grok-code-fast-1,xai,qemu-alpine-ssh,2375,2999,5374,438.084797,False,0.0,grok-code-fast-1,qemu-alpine-ssh,438.084797,False,0.0,False,438.084797 +d774b13d-faa4-4d06-80c3-755b99d54104,gemini-2.5-flash,gemini,cobol-modernization,3738,12602,16340,900.71718,False,0.0,gemini-2.5-flash,cobol-modernization,900.71718,False,0.2,False,900.71718 +9214016a-12d3-47ad-903a-53708eea5210,moonshotai/Kimi-K2-Instruct-0905,together_ai,run-pdp11-code,8294,7353,15647,1006.292308,False,0.0,moonshotai/Kimi-K2-Instruct-0905,run-pdp11-code,1006.292308,False,0.0,False,1006.292308 +d9614988-4b95-4409-a8e0-9345e439c5a3,deepseek-ai/DeepSeek-V3.1,together_ai,build-pov-ray,31536,32950,64486,6213.433423,False,0.0,deepseek-ai/DeepSeek-V3.1,build-pov-ray,6213.433423,False,0.4,False,6213.433423 +7ad260af-21cf-4f97-9c8d-962491daeebe,gpt-5-mini,openai,make-doom-for-mips,3237,3401,6638,903.196624,False,0.0,gpt-5-mini,make-doom-for-mips,903.196624,False,0.0,False,903.196624 +96ce99b7-bb4e-4d7b-9751-80b65d681237,grok-4-0709,xai,run-pdp11-code,3276,2125,5401,1002.96926,False,0.0,grok-4-0709,run-pdp11-code,1002.96926,False,0.0,False,1002.96926 
+a0bd8ecd-2a8c-4df5-a7c3-b103ee62aff2,claude-opus-4-1-20250805,anthropic,schemelike-metacircular-eval,41229,34399,75628,2430.843741,False,0.0,claude-opus-4-1-20250805,schemelike-metacircular-eval,2430.843741,False,0.0,False,2430.843741 +001b8ead-4a37-47e4-9737-34ca951949fb,gpt-5-mini,openai,path-tracing-reverse,29313,23555,52868,1810.15497,False,0.0,gpt-5-mini,path-tracing-reverse,1810.15497,False,0.0,False,1810.15497 +e549c06c-2316-4319-b788-471d31311f92,OpenAI/gpt-oss-20B,together_ai,pypi-server,1079,2635,3714,190.194728,False,0.0,OpenAI/gpt-oss-20B,pypi-server,190.194728,False,0.2,False,190.194728 +f784c58f-84c6-4a24-ae6e-7010412fa287,OpenAI/gpt-oss-20B,together_ai,video-processing,168,1718,1886,99.775747,False,0.0,OpenAI/gpt-oss-20B,video-processing,99.775747,False,0.0,False,99.775747 +1faee519-791d-436a-931e-d27ea1245c0f,zai-org/GLM-4.5-Air-FP8,together_ai,build-pmars,17297,8916,26213,904.272271,False,0.0,zai-org/GLM-4.5-Air-FP8,build-pmars,904.272271,False,0.6,False,904.272271 +8172a25e-7b9b-4e90-b167-592f75300151,moonshotai/Kimi-K2-Instruct-0905,together_ai,fix-ocaml-gc,53219,23946,77165,2332.50221,False,0.0,moonshotai/Kimi-K2-Instruct-0905,fix-ocaml-gc,2332.50221,False,0.0,False,2332.50221 +8db0f589-2478-4fc8-8ef9-019ec342543d,deepseek-ai/DeepSeek-V3.1,together_ai,polyglot-c-py,19107,11996,31103,901.604527,False,0.0,deepseek-ai/DeepSeek-V3.1,polyglot-c-py,901.604527,False,0.0,False,901.604527 +8c3d5cd8-aac7-4e83-9b54-944eba57d818,gemini-2.5-flash,gemini,mteb-leaderboard,962,447,1409,78.655178,False,0.0,gemini-2.5-flash,mteb-leaderboard,78.655178,False,0.0,False,78.655178 +4de09ee5-4ae9-449a-9d06-264f3f435c83,claude-opus-4-1-20250805,anthropic,bn-fit-modify,14087,5810,19897,429.705317,True,1.0,claude-opus-4-1-20250805,bn-fit-modify,429.705317,True,0.875,True,429.705317 
+8fcb3879-147c-4629-9b41-e6ceaa3e8e95,claude-opus-4-1-20250805,anthropic,openssl-selfsigned-cert,4918,3738,8656,682.712621,True,1.0,claude-opus-4-1-20250805,openssl-selfsigned-cert,682.712621,True,1.0,True,682.712621 +6a506db4-fff4-4ef8-91e8-f75521b0f3f0,claude-opus-4-1-20250805,anthropic,prove-plus-comm,2082,1254,3336,116.805302,True,1.0,claude-opus-4-1-20250805,prove-plus-comm,116.805302,True,1.0,True,116.805302 +4c43f87a-b358-47e7-8530-b94836e99819,gemini-2.5-flash,gemini,extract-elf,1271,1135,2406,117.742669,False,0.0,gemini-2.5-flash,extract-elf,117.742669,False,0.4,False,117.742669 +cab09fd3-8155-49eb-8a7c-415df5bb7f3c,gpt-5,openai,password-recovery,4844,4032,8876,900.427213,False,0.0,gpt-5,password-recovery,900.427213,False,0.0,False,900.427213 +49f7029c-e89a-4ab8-9912-20cff8f06eee,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,reverse-engineering,2675,2779,5454,330.294595,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,reverse-engineering,330.294595,False,0.0,False,330.294595 +649303d3-19fd-4c73-8be9-9b7b59c5856c,gpt-5-mini,openai,constraints-scheduling,4310,3583,7893,279.480295,True,1.0,gpt-5-mini,constraints-scheduling,279.480295,True,0.8,True,279.480295 +e12a173d-734f-46f5-8240-9491a4017210,claude-sonnet-4-20250514,anthropic,write-compressor,10883,13353,24236,900.945399,False,0.0,claude-sonnet-4-20250514,write-compressor,900.945399,False,0.0,False,900.945399 +b5792fa5-773f-4f70-bb74-19e2997a75e1,grok-code-fast-1,xai,financial-document-processor,5809,1781,7590,83.73838,False,0.0,grok-code-fast-1,financial-document-processor,83.73838,False,0.0,False,83.73838 +3eae4e47-31ee-4938-88ec-495b1e16a3ee,deepseek-ai/DeepSeek-V3.1,together_ai,bn-fit-modify,8000,4230,12230,257.77484,False,0.0,deepseek-ai/DeepSeek-V3.1,bn-fit-modify,257.77484,False,0.0,False,257.77484 
+cee3d65f-9bd2-4b70-bb24-0a6d7ecd589b,claude-opus-4-1-20250805,anthropic,reverse-engineering,14990,8044,23034,2612.21751,False,0.0,claude-opus-4-1-20250805,reverse-engineering,2612.21751,False,0.0,False,2612.21751 +c1f3506c-df21-44ee-bf83-b74b63d60fcf,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,break-filter-js-from-html,2709,2659,5368,509.872238,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,break-filter-js-from-html,509.872238,False,0.0,False,509.872238 +4d8de6e7-5262-4ea5-8498-ef980d13e314,gpt-5,openai,polyglot-c-py,1694,1104,2798,215.933267,False,0.0,gpt-5,polyglot-c-py,215.933267,False,0.0,False,215.933267 +8207d8eb-e02b-407a-9c27-68fb53223489,gemini-2.5-pro,gemini,configure-git-webserver,5040,1007,6047,228.676898,False,0.0,gemini-2.5-pro,configure-git-webserver,228.676898,False,0.0,False,228.676898 +86465dc4-c277-474b-abad-8aecd61bc1c8,gemini-2.5-pro,gemini,dna-assembly,6561,7404,13965,434.661754,False,0.0,gemini-2.5-pro,dna-assembly,434.661754,False,0.0,False,434.661754 +050f40b6-f8fc-4f0b-a599-8c4aced4d44a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,polyglot-c-py,4310,3408,7718,193.214625,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,polyglot-c-py,193.214625,False,0.0,False,193.214625 +9d0be9a1-0b68-4a59-8733-3d9a723d6d7b,grok-4-0709,xai,torch-tensor-parallelism,1574,826,2400,182.975585,False,0.0,grok-4-0709,torch-tensor-parallelism,182.975585,False,0.0,False,182.975585 +129b4526-38e0-42a6-a364-4abe3c127d28,claude-opus-4-1-20250805,anthropic,tune-mjcf,21285,18772,40057,900.009322,False,0.0,claude-opus-4-1-20250805,tune-mjcf,900.009322,False,0.25,False,900.009322 +bb53acdd-4535-4c63-bcbc-affdf4a87c43,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,tune-mjcf,10327,7882,18209,905.38447,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,tune-mjcf,905.38447,False,0.0,False,905.38447 
+24cb400d-b6db-4242-9329-4229e85f85ba,gpt-5-mini,openai,mteb-retrieve,6711,5434,12145,412.934795,False,0.0,gpt-5-mini,mteb-retrieve,412.934795,False,0.0,False,412.934795 +c07652f4-dd0c-43b6-80d7-a6ce535b2d15,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,largest-eigenval,2990,2323,5313,907.211007,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,largest-eigenval,907.211007,False,0.0,False,907.211007 +a961976c-4b1d-47ce-94b6-60c5aa5f2359,gemini-2.5-flash,gemini,fix-ocaml-gc,36050,33861,69911,3600.488881,False,0.0,gemini-2.5-flash,fix-ocaml-gc,3600.488881,False,0.0,False,3600.488881 +69454a0b-f518-4501-b003-ba26d9981629,gemini-2.5-pro,gemini,sanitize-git-repo,8783,1697,10480,268.295875,False,0.0,gemini-2.5-pro,sanitize-git-repo,268.295875,False,0.0,False,268.295875 +1a487bbd-b3f1-4fd6-9ce6-0f4ec59624ac,claude-sonnet-4-20250514,anthropic,run-pdp11-code,12646,5582,18228,1039.243392,False,0.0,claude-sonnet-4-20250514,run-pdp11-code,1039.243392,False,0.0,False,1039.243392 +3a94e965-6fa6-4572-970c-102b67228bba,gemini-2.5-flash,gemini,dna-insert,6169,19886,26055,628.360897,False,0.0,gemini-2.5-flash,dna-insert,628.360897,False,0.0,False,628.360897 +ed5dd1f2-c3cd-4031-9f8d-461afecd1352,gemini-2.5-flash,gemini,build-cython-ext,21129,9004,30133,900.239173,False,0.0,gemini-2.5-flash,build-cython-ext,900.239173,False,0.0,False,900.239173 +45085700-60c5-4a1d-bccc-c26635c6d474,claude-opus-4-1-20250805,anthropic,video-processing,3302,2515,5817,162.099751,False,0.0,claude-opus-4-1-20250805,video-processing,162.099751,False,0.0,False,162.099751 +61d922bf-544a-4720-9433-f866f23d622b,openai/gpt-oss-120b,together_ai,mteb-leaderboard,930,301,1231,76.385778,False,0.0,openai/gpt-oss-120b,mteb-leaderboard,76.385778,False,0.0,False,76.385778 +b1e73074-87af-467f-9cf2-d38237429456,gemini-2.5-pro,gemini,path-tracing-reverse,8581,4314,12895,575.791679,False,0.0,gemini-2.5-pro,path-tracing-reverse,575.791679,False,0.0,False,575.791679 
+6620592f-7629-4e2a-809f-8a17218f9828,openai/gpt-oss-120b,together_ai,hf-model-inference,3548,1086,4634,136.968838,False,0.0,openai/gpt-oss-120b,hf-model-inference,136.968838,False,0.0,False,136.968838 +43462abe-2444-41c2-a0a7-b4db7b35b726,claude-sonnet-4-20250514,anthropic,polyglot-rust-c,7110,7383,14493,902.534725,False,0.0,claude-sonnet-4-20250514,polyglot-rust-c,902.534725,False,0.0,False,902.534725 +19382d53-a43c-45af-a7e2-20425ce1b2cd,gemini-2.5-flash,gemini,install-klee-minimal,11058,2603,13661,900.155278,False,0.0,gemini-2.5-flash,install-klee-minimal,900.155278,False,0.0,False,900.155278 +3f08affe-15f6-4532-85f2-52ce6e853c29,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,extract-elf,3196,1198,4394,150.776812,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,extract-elf,150.776812,False,0.0,False,150.776812 +ad53aa1f-22d8-4b8d-a25b-89bec1c9a99e,claude-opus-4-1-20250805,anthropic,distribution-search,20360,28293,48653,3600.002506,False,0.0,claude-opus-4-1-20250805,distribution-search,3600.002506,False,0.5555555555555556,False,3600.002506 +47598924-df71-44ac-b3ba-74a78d0feef9,gemini-2.5-pro,gemini,regex-log,1407,818,2225,201.023431,True,1.0,gemini-2.5-pro,regex-log,201.023431,True,0.8,True,201.023431 +fe13e430-f84e-4245-9e5a-8788f0b616bf,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,password-recovery,1602,1994,3596,555.30096,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,password-recovery,555.30096,False,0.0,False,555.30096 +ec1bb383-d44f-4b55-a845-c1ccf8b411fc,claude-opus-4-1-20250805,anthropic,dna-insert,6306,6255,12561,360.000856,False,0.0,claude-opus-4-1-20250805,dna-insert,360.000856,False,0.0,False,360.000856 +804df6d1-a32d-4a0b-a2c9-47338efebf93,gpt-5-nano,openai,tune-mjcf,4163,4861,9024,906.288846,False,0.0,gpt-5-nano,tune-mjcf,906.288846,False,0.0,False,906.288846 
+9791aaad-5e69-43a1-8380-d5a05935faa0,grok-4-0709,xai,winning-avg-corewars,14602,15249,29851,3626.878843,False,0.0,grok-4-0709,winning-avg-corewars,3626.878843,False,0.0,False,3626.878843 +c4a902a0-d8a6-4df4-ab3c-2b61f2bea217,gemini-2.5-flash,gemini,regex-log,1395,1840,3235,115.098416,True,1.0,gemini-2.5-flash,regex-log,115.098416,True,0.8,True,115.098416 +eefad2e0-7cd5-4e46-ac53-01536000f05c,claude-opus-4-1-20250805,anthropic,model-extraction-relu-logits,15255,14260,29515,900.009188,False,0.0,claude-opus-4-1-20250805,model-extraction-relu-logits,900.009188,False,0.0,False,900.009188 +ffcd079d-4317-47bd-858e-42585a99765a,gemini-2.5-pro,gemini,constraints-scheduling,3635,2611,6246,524.276474,True,1.0,gemini-2.5-pro,constraints-scheduling,524.276474,True,1.0,True,524.276474 +a1cf1b4c-f1e7-406f-965e-cafebd80f2da,deepseek-ai/DeepSeek-V3.1,together_ai,largest-eigenval,11679,9423,21102,837.504525,False,0.0,deepseek-ai/DeepSeek-V3.1,largest-eigenval,837.504525,False,0.2,False,837.504525 +9f81c2a8-afe9-4a34-94f3-156edd20e0c8,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,constraints-scheduling,8790,6469,15259,461.740362,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,constraints-scheduling,461.740362,False,0.0,False,461.740362 +17a43245-37b4-4169-b107-622faa7a3906,OpenAI/gpt-oss-20B,together_ai,vulnerable-secret,1163,2297,3460,70.706258,False,0.0,OpenAI/gpt-oss-20B,vulnerable-secret,70.706258,False,0.0,False,70.706258 +bd5ec0ab-6205-4d82-8744-c6f95775a718,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,vulnerable-secret,12869,2515,15384,506.285393,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,vulnerable-secret,506.285393,True,0.4,True,506.285393 +df359dc5-3a10-4473-8604-e77d0b4a7213,gpt-5-mini,openai,log-summary-date-ranges,2365,2818,5183,94.414215,False,0.0,gpt-5-mini,log-summary-date-ranges,94.414215,False,0.0,False,94.414215 
+4ac52660-8dfd-44ee-8788-728c6bae2047,grok-4-0709,xai,torch-tensor-parallelism,1533,1606,3139,558.002263,False,0.0,grok-4-0709,torch-tensor-parallelism,558.002263,False,0.0,False,558.002263 +3adbea08-93ea-4db0-93c1-1d3e809c0cd3,OpenAI/gpt-oss-20B,together_ai,large-scale-text-editing,308,2358,2666,115.260378,False,0.0,OpenAI/gpt-oss-20B,large-scale-text-editing,115.260378,False,0.0,False,115.260378 +b867e9ba-5abd-45e1-bd76-79d5ed8e5285,openai/gpt-oss-120b,together_ai,video-processing,7571,8698,16269,481.845186,False,0.0,openai/gpt-oss-120b,video-processing,481.845186,False,0.0,False,481.845186 +8b40e7e5-2617-4f21-839d-f7db09730e5f,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,mteb-retrieve,2893,1936,4829,239.285989,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,mteb-retrieve,239.285989,False,0.0,False,239.285989 +cc9477e9-aafe-49de-be3f-7ea47163a9c5,grok-4-0709,xai,crack-7z-hash,8376,4030,12406,735.856104,True,1.0,grok-4-0709,crack-7z-hash,735.856104,True,0.8,True,735.856104 +f5973661-ad82-452f-a89e-0430ac60ffd7,gemini-2.5-pro,gemini,feal-differential-cryptanalysis,2866,2181,5047,477.303108,False,0.0,gemini-2.5-pro,feal-differential-cryptanalysis,477.303108,False,0.6,False,477.303108 +25216d68-52ae-47fb-a886-27d89e4bd382,moonshotai/Kimi-K2-Instruct-0905,together_ai,vulnerable-secret,10998,7475,18473,719.419793,True,1.0,moonshotai/Kimi-K2-Instruct-0905,vulnerable-secret,719.419793,True,0.2,True,719.419793 +667236fa-ea82-4c71-9fd0-ed933c887f36,openai/gpt-oss-120b,together_ai,winning-avg-corewars,17913,19662,37575,1380.136805,False,0.0,openai/gpt-oss-120b,winning-avg-corewars,1380.136805,False,0.5,False,1380.136805 +202f5a30-bc3d-4e59-9c49-d6510a12d1cd,deepseek-ai/DeepSeek-V3.1,together_ai,circuit-fibsqrt,26561,21319,47880,1826.480872,False,0.0,deepseek-ai/DeepSeek-V3.1,circuit-fibsqrt,1826.480872,False,0.0,False,1826.480872 
+95bddb5a-2652-4efd-9591-97f7b3514602,gpt-5-nano,openai,pypi-server,13765,7504,21269,761.841603,True,1.0,gpt-5-nano,pypi-server,761.841603,True,0.8,True,761.841603 +e0ebe836-12cd-480e-afe6-70cac4e65ad7,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,bn-fit-modify,35830,10679,46509,1436.95288,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,bn-fit-modify,1436.95288,False,0.0,False,1436.95288 +131933a1-ceb2-4f41-a125-aa0ad45bf861,gpt-5,openai,winning-avg-corewars,18669,15845,34514,2896.633235,True,1.0,gpt-5,winning-avg-corewars,2896.633235,True,0.2857142857142857,True,2896.633235 +584e6f6a-7f25-4bcc-976a-2b6d4f1baeb3,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-initramfs-qemu,7546,7241,14787,552.90485,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-initramfs-qemu,552.90485,False,0.0,False,552.90485 +b806eeac-65bb-4d9f-af81-32a9487409c7,claude-sonnet-4-20250514,anthropic,vulnerable-secret,5191,7850,13041,900.136937,False,0.0,claude-sonnet-4-20250514,vulnerable-secret,900.136937,False,0.0,False,900.136937 +0f07f8aa-5e00-4c24-9503-1de0f62835fd,claude-opus-4-1-20250805,anthropic,largest-eigenval,13662,8500,22162,292.508897,True,1.0,claude-opus-4-1-20250805,largest-eigenval,292.508897,True,0.25,True,292.508897 +e8409ebe-6b1d-44d2-8bdf-d656c602f96e,gpt-5-nano,openai,video-processing,3650,3375,7025,138.731875,False,0.0,gpt-5-nano,video-processing,138.731875,False,0.0,False,138.731875 +1abc30ff-c2e7-419d-9140-77bafb5b886b,OpenAI/gpt-oss-20B,together_ai,polyglot-rust-c,75,734,809,900.017177,False,0.0,OpenAI/gpt-oss-20B,polyglot-rust-c,900.017177,False,0.0,False,900.017177 +856b9854-86c6-45a4-aa4f-0c31c512e1a8,grok-code-fast-1,xai,hf-model-inference,3627,1085,4712,152.852531,True,1.0,grok-code-fast-1,hf-model-inference,152.852531,True,0.4,True,152.852531 
+84465b91-466d-4629-90fc-96ac86b42d19,gpt-5,openai,mteb-leaderboard,8637,8122,16759,765.773785,False,0.0,gpt-5,mteb-leaderboard,765.773785,False,0.0,False,765.773785 +1a46f3f1-b9fb-4ebc-b237-591ea5e2c1aa,deepseek-ai/DeepSeek-V3.1,together_ai,schemelike-metacircular-eval,42096,47026,89122,2176.908106,False,0.0,deepseek-ai/DeepSeek-V3.1,schemelike-metacircular-eval,2176.908106,False,0.0,False,2176.908106 +d5a6d572-6933-49c6-ab6a-d2927bb7aca4,grok-code-fast-1,xai,build-initramfs-qemu,1792,1567,3359,45.989782,False,0.0,grok-code-fast-1,build-initramfs-qemu,45.989782,False,0.0,False,45.989782 +0c53e65c-912b-478a-bd1f-fa4d78f3719b,gpt-5,openai,fix-git,3766,1600,5366,137.151731,True,1.0,gpt-5,fix-git,137.151731,True,1.0,True,137.151731 +e538dc23-d30d-455f-a5d0-b9f6f064f353,gemini-2.5-flash,gemini,sparql-university,1082,869,1951,56.828186,False,0.0,gemini-2.5-flash,sparql-university,56.828186,False,0.0,False,56.828186 +f9a8cd6e-4148-4c01-8899-25228c284cba,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,break-filter-js-from-html,1917,1557,3474,197.006478,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,break-filter-js-from-html,197.006478,False,0.0,False,197.006478 +40c0d6f8-4c58-45b2-87be-9a12e33f64f6,moonshotai/Kimi-K2-Instruct-0905,together_ai,path-tracing,10500,11361,21861,1101.284906,False,0.0,moonshotai/Kimi-K2-Instruct-0905,path-tracing,1101.284906,False,0.0,False,1101.284906 +879ee685-4c36-49e1-b774-d2e272962dca,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,cobol-modernization,14380,14576,28956,915.06147,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,cobol-modernization,915.06147,False,0.4,False,915.06147 +bbf9e4c6-c784-487b-b036-dbb5f4b80399,gemini-2.5-pro,gemini,pytorch-model-recovery,4935,3949,8884,910.228245,True,1.0,gemini-2.5-pro,pytorch-model-recovery,910.228245,True,1.0,True,910.228245 
+a44da1ed-b12e-4153-b5e1-fdd171eab7ac,grok-4-0709,xai,qemu-startup,1229,1490,2719,1018.743296,True,1.0,grok-4-0709,qemu-startup,1018.743296,True,0.4,True,1018.743296 +4bc89ec1-a3be-490a-81e7-69826af76afe,moonshotai/Kimi-K2-Instruct-0905,together_ai,qemu-startup,3537,5721,9258,937.207314,True,1.0,moonshotai/Kimi-K2-Instruct-0905,qemu-startup,937.207314,True,0.4,True,937.207314 +ee0b3f4d-5bb5-4cad-b349-1ed614e6cbf0,openai/gpt-oss-120b,together_ai,form-filling,2745,2175,4920,226.702148,False,0.0,openai/gpt-oss-120b,form-filling,226.702148,False,0.6,False,226.702148 +95282df7-782c-4cd6-9a92-0a73ba18dd4b,gpt-5,openai,db-wal-recovery,3509,2117,5626,124.038376,True,1.0,gpt-5,db-wal-recovery,124.038376,True,0.1428571428571428,True,124.038376 +7bdef584-b684-48a4-929e-e59bd6e7b804,gemini-2.5-flash,gemini,chess-best-move,7068,6922,13990,694.564034,False,0.0,gemini-2.5-flash,chess-best-move,694.564034,False,0.0,False,694.564034 +d0738b88-a75e-451b-841c-1e47cd219ac8,grok-code-fast-1,xai,crack-7z-hash,11745,3590,15335,759.74762,True,1.0,grok-code-fast-1,crack-7z-hash,759.74762,True,0.6,True,759.74762 +34523b03-4d0a-4378-a7a5-4bfbfdc0b2cc,zai-org/GLM-4.5-Air-FP8,together_ai,configure-git-webserver,6958,3071,10029,260.746594,False,0.0,zai-org/GLM-4.5-Air-FP8,configure-git-webserver,260.746594,False,0.0,False,260.746594 +ffb28932-018e-4caa-bd35-c5cf59a53122,gpt-5,openai,torch-tensor-parallelism,2932,4399,7331,168.983089,False,0.0,gpt-5,torch-tensor-parallelism,168.983089,False,0.0,False,168.983089 +ec628432-aab1-4922-8169-5e96720b2162,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,nginx-request-logging,5395,4166,9561,212.602059,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,nginx-request-logging,212.602059,False,0.0,False,212.602059 +6970fc53-2bee-4320-86ac-3b03800b481c,grok-4-0709,xai,build-cython-ext,8644,3056,11700,919.754113,False,0.0,grok-4-0709,build-cython-ext,919.754113,False,0.0,False,919.754113 
+88a3bb0f-0ea8-46db-9837-30606364e166,zai-org/GLM-4.5-Air-FP8,together_ai,polyglot-c-py,5585,5728,11313,1025.306904,False,0.0,zai-org/GLM-4.5-Air-FP8,polyglot-c-py,1025.306904,False,0.0,False,1025.306904 +cf241e94-fd59-4019-88fd-ebd85e1a36ce,grok-code-fast-1,xai,bn-fit-modify,23472,9776,33248,1394.598372,False,0.0,grok-code-fast-1,bn-fit-modify,1394.598372,False,0.0,False,1394.598372 +60fe1148-64b9-482d-ba72-28b100ebf8ea,grok-code-fast-1,xai,openssl-selfsigned-cert,1776,1107,2883,82.783771,False,0.0,grok-code-fast-1,openssl-selfsigned-cert,82.783771,False,0.2,False,82.783771 +c7c1f375-a11a-44fd-bb85-1ff5485c4f5b,gpt-5,openai,break-filter-js-from-html,3619,2132,5751,615.119177,True,1.0,gpt-5,break-filter-js-from-html,615.119177,True,0.4285714285714285,True,615.119177 +83308219-5470-4a16-9a38-37fa964effc5,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,qemu-alpine-ssh,3937,4817,8754,933.500665,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,qemu-alpine-ssh,933.500665,False,0.2,False,933.500665 +87832daf-8d14-4806-a704-3530a25daa3b,zai-org/GLM-4.5-Air-FP8,together_ai,build-initramfs-qemu,1633,1974,3607,144.180436,False,0.0,zai-org/GLM-4.5-Air-FP8,build-initramfs-qemu,144.180436,False,0.0,False,144.180436 +5685eabb-5488-422b-b191-19ddcfeeba45,claude-sonnet-4-20250514,anthropic,vulnerable-secret,3253,2262,5515,906.757759,False,0.0,claude-sonnet-4-20250514,vulnerable-secret,906.757759,False,0.0,False,906.757759 +94f6ca4f-80c7-43ae-a8a1-efe58bc63540,gemini-2.5-pro,gemini,install-klee-minimal,11930,2204,14134,900.181155,False,0.0,gemini-2.5-pro,install-klee-minimal,900.181155,False,0.0,False,900.181155 +2701c142-1dc6-4d92-ba86-a37a7a87941e,deepseek-ai/DeepSeek-V3.1,together_ai,feal-differential-cryptanalysis,26046,34069,60115,1800.03677,False,0.0,deepseek-ai/DeepSeek-V3.1,feal-differential-cryptanalysis,1800.03677,False,0.0,False,1800.03677 
+773bcf4d-23c0-458c-967e-6e463509bf6e,gpt-5-mini,openai,path-tracing,15673,12172,27845,1100.400333,False,0.0,gpt-5-mini,path-tracing,1100.400333,False,0.0,False,1100.400333 +eda5dfea-e3ea-4ca3-857b-604d9f1b352c,grok-code-fast-1,xai,dna-assembly,5832,1546,7378,138.63623,False,0.0,grok-code-fast-1,dna-assembly,138.63623,False,0.0,False,138.63623 +717bde28-03f3-4aeb-b8b6-13fbc007aec1,zai-org/GLM-4.5-Air-FP8,together_ai,bn-fit-modify,13737,10415,24152,978.36311,False,0.0,zai-org/GLM-4.5-Air-FP8,bn-fit-modify,978.36311,False,0.0,False,978.36311 +5bcf5723-8b8f-46f3-b65b-1ab7c0008e20,zai-org/GLM-4.5-Air-FP8,together_ai,build-pmars,16951,4577,21528,196.1096,True,1.0,zai-org/GLM-4.5-Air-FP8,build-pmars,196.1096,True,0.6,True,196.1096 +ebc95ba1-88f2-4d35-acac-43692742a910,zai-org/GLM-4.5-Air-FP8,together_ai,count-dataset-tokens,18018,7470,25488,605.313678,False,0.0,zai-org/GLM-4.5-Air-FP8,count-dataset-tokens,605.313678,False,0.0,False,605.313678 +ae0c8810-8e4f-496a-9ca7-9e72d8046bb5,gpt-5-mini,openai,openssl-selfsigned-cert,2176,2291,4467,197.233028,True,1.0,gpt-5-mini,openssl-selfsigned-cert,197.233028,True,0.8,True,197.233028 +76db8ef1-d55b-4b76-82c2-7eeaa0ee9d73,claude-sonnet-4-20250514,anthropic,openssl-selfsigned-cert,1180,403,1583,1268.274704,False,0.0,claude-sonnet-4-20250514,openssl-selfsigned-cert,1268.274704,False,0.8,False,1268.274704 +bb850552-9147-4269-9a7f-0edb85891dee,moonshotai/Kimi-K2-Instruct-0905,together_ai,polyglot-c-py,4410,4528,8938,1009.323618,False,0.0,moonshotai/Kimi-K2-Instruct-0905,polyglot-c-py,1009.323618,False,0.0,False,1009.323618 +61f28ccf-a7d3-4674-8fc3-c36c15b39e8f,moonshotai/Kimi-K2-Instruct-0905,together_ai,train-fasttext,13134,8620,21754,3198.453359,True,1.0,moonshotai/Kimi-K2-Instruct-0905,train-fasttext,3198.453359,True,0.2,True,3198.453359 
+1ef92e4c-b367-4a6f-b7d7-67d2de7d6587,zai-org/GLM-4.5-Air-FP8,together_ai,path-tracing-reverse,21563,7519,29082,254.990001,False,0.0,zai-org/GLM-4.5-Air-FP8,path-tracing-reverse,254.990001,False,0.0,False,254.990001 +9e6df700-6705-4b41-b1cc-467fb1074b63,gemini-2.5-pro,gemini,build-initramfs-qemu,4623,1789,6412,125.64759,False,0.0,gemini-2.5-pro,build-initramfs-qemu,125.64759,False,0.0,False,125.64759 +2c7ec8df-5d88-45c9-9e73-954e41eeffcb,grok-code-fast-1,xai,circuit-fibsqrt,2040,2117,4157,204.260426,False,0.0,grok-code-fast-1,circuit-fibsqrt,204.260426,False,0.0,False,204.260426 +8b92fefd-ddff-41ee-a57a-24fe7fdfcceb,deepseek-ai/DeepSeek-V3.1,together_ai,large-scale-text-editing,8590,8723,17313,827.301076,False,0.0,deepseek-ai/DeepSeek-V3.1,large-scale-text-editing,827.301076,False,0.0,False,827.301076 +76cf5a03-9456-4a71-b06e-325f103b3fd9,grok-4-0709,xai,build-cython-ext,10425,4922,15347,900.017413,False,0.0,grok-4-0709,build-cython-ext,900.017413,False,0.0,False,900.017413 +2d8ee2fc-2016-4245-9a1e-1d3ac4749918,OpenAI/gpt-oss-20B,together_ai,financial-document-processor,447,1545,1992,76.534794,False,0.0,OpenAI/gpt-oss-20B,financial-document-processor,76.534794,False,0.0,False,76.534794 +4b7c492e-dc66-4108-b1cc-1b6556c81c6b,claude-opus-4-1-20250805,anthropic,chess-best-move,8055,4559,12614,210.156209,False,0.0,claude-opus-4-1-20250805,chess-best-move,210.156209,False,0.0,False,210.156209 +59c76845-2ee2-4c71-8fc1-8fbbc5eeb900,gpt-5,openai,gpt2-codegolf,3622,3685,7307,909.627104,False,0.0,gpt-5,gpt2-codegolf,909.627104,False,0.0,False,909.627104 +d6acfbef-08ce-49ca-ad67-be04b9e885ad,grok-4-0709,xai,cancel-async-tasks,1115,521,1636,221.165722,False,0.0,grok-4-0709,cancel-async-tasks,221.165722,False,0.0,False,221.165722 +36f36bc0-00f8-4f7c-9be2-e32bdf87c159,gemini-2.5-flash,gemini,polyglot-rust-c,2185,1474,3659,905.47061,False,0.0,gemini-2.5-flash,polyglot-rust-c,905.47061,False,0.0,False,905.47061 
+edba987e-f279-4308-824a-27050f2e10c4,gpt-5-nano,openai,prove-plus-comm,4301,4138,8439,900.023277,False,0.0,gpt-5-nano,prove-plus-comm,900.023277,False,0.4,False,900.023277 +147ee5a8-f2fb-4987-a5ac-38e2e6ee8929,openai/gpt-oss-120b,together_ai,feal-differential-cryptanalysis,1609,1161,2770,139.054137,False,0.0,openai/gpt-oss-120b,feal-differential-cryptanalysis,139.054137,False,0.0,False,139.054137 +edcf76a3-f793-47af-88e8-9c384dbd5c26,gpt-5-nano,openai,mteb-retrieve,4440,3910,8350,661.036411,False,0.0,gpt-5-nano,mteb-retrieve,661.036411,False,0.0,False,661.036411 +121ff17a-15ac-43eb-bf32-79cb28c00cee,claude-sonnet-4-20250514,anthropic,install-klee-minimal,20535,3215,23750,903.034968,False,0.0,claude-sonnet-4-20250514,install-klee-minimal,903.034968,False,0.0,False,903.034968 +e32be8d8-fd6b-4a05-b1ae-b3a3e7bdd55f,gemini-2.5-pro,gemini,prove-plus-comm,2215,2074,4289,227.05448,True,1.0,gemini-2.5-pro,prove-plus-comm,227.05448,True,0.8,True,227.05448 +3c1113be-ffdc-4de1-a295-0795935b2ff4,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,password-recovery,7194,6362,13556,796.656521,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,password-recovery,796.656521,True,0.2,True,796.656521 +fd0b345a-0e8a-4382-8f39-5335d3c6cf32,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,nginx-request-logging,7454,5045,12499,664.485247,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,nginx-request-logging,664.485247,True,0.4,True,664.485247 +e8e31986-ae94-4e34-81af-91c0c82aa908,gpt-5-nano,openai,make-doom-for-mips,11289,4558,15847,916.42802,False,0.0,gpt-5-nano,make-doom-for-mips,916.42802,False,0.0,False,916.42802 +3dbd774d-c9d1-4c47-a26a-aebf98a287b5,openai/gpt-oss-120b,together_ai,torch-tensor-parallelism,4015,3538,7553,574.500412,False,0.0,openai/gpt-oss-120b,torch-tensor-parallelism,574.500412,False,0.0,False,574.500412 
+3153e3ab-3d98-4261-aa9e-a1c149b964aa,openai/gpt-oss-120b,together_ai,log-summary-date-ranges,2067,2091,4158,95.80214,False,0.0,openai/gpt-oss-120b,log-summary-date-ranges,95.80214,False,0.0,False,95.80214 +d17f5380-55a8-4cbf-a809-50e5f84e4d85,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,path-tracing-reverse,19441,15529,34970,1475.115557,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,path-tracing-reverse,1475.115557,False,0.0,False,1475.115557 +81866dec-0a7b-41b9-b34d-da7dbe0715a4,claude-sonnet-4-20250514,anthropic,distribution-search,14100,12136,26236,741.668815,True,1.0,claude-sonnet-4-20250514,distribution-search,741.668815,True,0.6,True,741.668815 +e434385a-a6fb-47b3-8186-f6955d2df967,gpt-5-mini,openai,model-extraction-relu-logits,1731,1359,3090,138.091196,False,0.0,gpt-5-mini,model-extraction-relu-logits,138.091196,False,0.0,False,138.091196 +b52b7e65-ce21-41cb-a3e6-5f956ab3c49f,grok-4-0709,xai,make-doom-for-mips,17289,3163,20452,909.325168,False,0.0,grok-4-0709,make-doom-for-mips,909.325168,False,0.0,False,909.325168 +fe991bdd-e5a8-4979-aefb-ae37e97f08eb,gpt-5,openai,make-mips-interpreter,809,1135,1944,1800.001333,False,0.0,gpt-5,make-mips-interpreter,1800.001333,False,0.0,False,1800.001333 +f28694ea-e1ec-45dc-9a07-4863f3418846,deepseek-ai/DeepSeek-V3.1,together_ai,qemu-startup,1699,1327,3026,169.785717,False,0.0,deepseek-ai/DeepSeek-V3.1,qemu-startup,169.785717,False,0.2,False,169.785717 +fb125afa-5585-418f-ab83-032d673b27e7,gpt-5-nano,openai,model-extraction-relu-logits,2411,1944,4355,179.623617,False,0.0,gpt-5-nano,model-extraction-relu-logits,179.623617,False,0.0,False,179.623617 +3634371f-5cfa-4c2e-aa9d-dfa0dec47a6b,moonshotai/Kimi-K2-Instruct-0905,together_ai,password-recovery,5129,6529,11658,900.211672,False,0.0,moonshotai/Kimi-K2-Instruct-0905,password-recovery,900.211672,False,0.2,False,900.211672 
+628ea5a3-9861-4ac7-aae1-c13980af9ad1,claude-sonnet-4-20250514,anthropic,large-scale-text-editing,3910,9452,13362,1243.338707,True,1.0,claude-sonnet-4-20250514,large-scale-text-editing,1243.338707,True,0.6,True,1243.338707 +623c665d-c336-4e94-8d21-e55ce2dd16bb,OpenAI/gpt-oss-20B,together_ai,dna-insert,2281,4109,6390,585.561517,False,0.0,OpenAI/gpt-oss-20B,dna-insert,585.561517,False,0.0,False,585.561517 +e6a01123-7302-40c0-bdf7-ef2ae4b34ae9,zai-org/GLM-4.5-Air-FP8,together_ai,torch-tensor-parallelism,1807,1523,3330,102.288619,False,0.0,zai-org/GLM-4.5-Air-FP8,torch-tensor-parallelism,102.288619,False,0.0,False,102.288619 +b4def6cd-da27-405b-b54f-a69b96fbb0fc,claude-opus-4-1-20250805,anthropic,break-filter-js-from-html,6863,7185,14048,1228.124283,False,0.0,claude-opus-4-1-20250805,break-filter-js-from-html,1228.124283,False,0.2222222222222222,False,1228.124283 +b785de13-5968-4e49-8825-ed9a5deb3571,zai-org/GLM-4.5-Air-FP8,together_ai,feal-linear-cryptanalysis,10532,6879,17411,440.10435,False,0.0,zai-org/GLM-4.5-Air-FP8,feal-linear-cryptanalysis,440.10435,False,0.0,False,440.10435 +57d30762-11a8-4931-8177-c1f4ad095aa7,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sqlite-db-truncate,3550,1833,5383,212.356638,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sqlite-db-truncate,212.356638,False,0.0,False,212.356638 +5fbe8bbc-cc8d-4e70-b4c3-063c931f99fa,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-pmars,15201,5167,20368,612.808052,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-pmars,612.808052,True,1.0,True,612.808052 +21fb9e43-1658-4e4c-a923-d7735aabc3c2,gpt-5,openai,build-initramfs-qemu,3243,2579,5822,929.613089,False,0.0,gpt-5,build-initramfs-qemu,929.613089,False,0.0,False,929.613089 +d73d427c-a78a-47a5-8994-5c1b06869a3e,claude-opus-4-1-20250805,anthropic,extract-elf,10355,7526,17881,323.859053,True,1.0,claude-opus-4-1-20250805,extract-elf,323.859053,True,0.8888888888888888,True,323.859053 
+9ef3a495-c9ee-45d7-819c-c274a66a64c4,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,vulnerable-secret,2398,2363,4761,908.632177,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,vulnerable-secret,908.632177,False,0.0,False,908.632177 +d60b7f97-eb79-4057-8ca9-9abe9b9db591,gpt-5,openai,git-leak-recovery,1696,1054,2750,109.092514,True,1.0,gpt-5,git-leak-recovery,109.092514,True,0.7142857142857143,True,109.092514 +8f78de3c-61dd-43a5-a8fa-d6cbc706b597,claude-opus-4-1-20250805,anthropic,extract-elf,6039,2734,8773,251.076883,True,1.0,claude-opus-4-1-20250805,extract-elf,251.076883,True,0.8888888888888888,True,251.076883 +2d6871f2-784a-436e-9972-739d90c258af,claude-sonnet-4-20250514,anthropic,merge-diff-arc-agi-task,19520,9341,28861,798.267702,False,0.0,claude-sonnet-4-20250514,merge-diff-arc-agi-task,798.267702,False,0.0,False,798.267702 +e19791a2-18bb-48be-b6c1-a571f73ed317,claude-sonnet-4-20250514,anthropic,train-fasttext,52073,16375,68448,3632.178211,False,0.0,claude-sonnet-4-20250514,train-fasttext,3632.178211,False,0.0,False,3632.178211 +a8ba26b7-655c-4485-983a-a3a3d551f68e,OpenAI/gpt-oss-20B,together_ai,constraints-scheduling,648,3810,4458,311.04735,False,0.0,OpenAI/gpt-oss-20B,constraints-scheduling,311.04735,False,0.2,False,311.04735 +07bec61b-b81e-430f-89af-0cd357b06d3b,OpenAI/gpt-oss-20B,together_ai,chess-best-move,8822,12098,20920,835.851092,False,0.0,OpenAI/gpt-oss-20B,chess-best-move,835.851092,False,0.0,False,835.851092 +599e85e8-e990-4392-a213-0609027773a8,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,run-pdp11-code,4237,1221,5458,309.008897,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,run-pdp11-code,309.008897,False,0.0,False,309.008897 +dcec8655-8344-45ff-ae61-00efa79f4234,grok-code-fast-1,xai,form-filling,4218,2516,6734,86.797682,False,0.0,grok-code-fast-1,form-filling,86.797682,False,0.6,False,86.797682 
+83ff0bfd-63ae-4cd1-959f-13edd7c0d9e2,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,winning-avg-corewars,12096,10798,22894,2500.151304,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,winning-avg-corewars,2500.151304,False,0.0,False,2500.151304 +ca690874-e570-4744-8edf-6cda0825e7c6,grok-4-0709,xai,dna-insert,1103,435,1538,383.523004,False,0.0,grok-4-0709,dna-insert,383.523004,False,0.0,False,383.523004 +8838b73f-5c99-439a-b254-f32398a23712,claude-sonnet-4-20250514,anthropic,configure-git-webserver,8867,3816,12683,411.967293,True,1.0,claude-sonnet-4-20250514,configure-git-webserver,411.967293,True,0.6,True,411.967293 +ce1ba356-19d9-43bb-bae1-220cb6d8d8bc,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,pypi-server,20983,7159,28142,905.443565,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,pypi-server,905.443565,False,0.0,False,905.443565 +e85a7a39-5de6-4f26-9fc7-418f7cfcda46,gemini-2.5-pro,gemini,tune-mjcf,6608,6948,13556,900.002714,False,0.0,gemini-2.5-pro,tune-mjcf,900.002714,False,0.2,False,900.002714 +7003de2c-f21a-47a1-8f84-e7328d41e32f,gemini-2.5-pro,gemini,dna-insert,6698,2850,9548,377.755718,False,0.0,gemini-2.5-pro,dna-insert,377.755718,False,0.0,False,377.755718 +c27036eb-23fc-40ce-a313-7a0fc794c843,gpt-5-nano,openai,vulnerable-secret,3316,4095,7411,901.541733,False,0.0,gpt-5-nano,vulnerable-secret,901.541733,False,0.2,False,901.541733 +b4e61eba-c320-4f78-a1f2-263dfe3d793d,grok-4-0709,xai,polyglot-c-py,1169,638,1807,166.432063,False,0.0,grok-4-0709,polyglot-c-py,166.432063,False,0.6,False,166.432063 +b7071872-cfef-42fc-8a08-a1f8d172ce73,grok-4-0709,xai,cancel-async-tasks,1048,752,1800,194.211972,False,0.0,grok-4-0709,cancel-async-tasks,194.211972,False,0.0,False,194.211972 +6f65eda1-c81b-4f27-998a-10a5aa38b875,grok-code-fast-1,xai,break-filter-js-from-html,6659,7507,14166,582.49914,False,0.0,grok-code-fast-1,break-filter-js-from-html,582.49914,False,0.0,False,582.49914 
+ca764b9d-cd5e-4566-8e75-4d1075a4ac13,gpt-5-nano,openai,video-processing,3504,3414,6918,273.32696,False,0.0,gpt-5-nano,video-processing,273.32696,False,0.0,False,273.32696 +043a46ec-1d45-4bc7-b47e-950dddd336ec,gemini-2.5-flash,gemini,qemu-alpine-ssh,1822,2395,4217,282.816872,False,0.0,gemini-2.5-flash,qemu-alpine-ssh,282.816872,False,0.0,False,282.816872 +03c00b2b-cd16-4db1-b0f7-ff5c0b64853b,gemini-2.5-flash,gemini,build-initramfs-qemu,4612,2995,7607,382.629468,False,0.0,gemini-2.5-flash,build-initramfs-qemu,382.629468,False,0.0,False,382.629468 +4a7b5122-cf42-441e-989d-8495d975beab,gpt-5-mini,openai,extract-elf,5297,3757,9054,277.409099,False,0.0,gpt-5-mini,extract-elf,277.409099,False,0.6,False,277.409099 +7e2eb257-28ac-49eb-9c18-24b2c50a5d36,moonshotai/Kimi-K2-Instruct-0905,together_ai,mteb-retrieve,4488,3633,8121,556.153563,False,0.0,moonshotai/Kimi-K2-Instruct-0905,mteb-retrieve,556.153563,False,0.0,False,556.153563 +5d857a44-8392-437f-95e9-49a69092d33e,gemini-2.5-flash,gemini,torch-tensor-parallelism,987,4075,5062,902.001107,False,0.0,gemini-2.5-flash,torch-tensor-parallelism,902.001107,False,0.0,False,902.001107 +0bd8e410-1d71-4e28-a1d3-40ea9b9a3567,gemini-2.5-flash,gemini,largest-eigenval,12673,15899,28572,900.235319,False,0.0,gemini-2.5-flash,largest-eigenval,900.235319,False,0.0,False,900.235319 +19a1e6fa-f010-4109-8e53-dd1813cee283,openai/gpt-oss-120b,together_ai,password-recovery,6609,3228,9837,907.98809,False,0.0,openai/gpt-oss-120b,password-recovery,907.98809,False,0.2,False,907.98809 +d1a0fa61-58d0-47e6-81d5-11f7d52a8c34,zai-org/GLM-4.5-Air-FP8,together_ai,port-compressor,58844,42304,101148,917.273604,False,0.0,zai-org/GLM-4.5-Air-FP8,port-compressor,917.273604,False,0.0,False,917.273604 +4b489bc8-c291-4280-87fe-f3e78f744c15,moonshotai/Kimi-K2-Instruct-0905,together_ai,train-fasttext,23434,20305,43739,3600.8256,False,0.0,moonshotai/Kimi-K2-Instruct-0905,train-fasttext,3600.8256,False,0.2,False,3600.8256 
+c125a170-7f90-45af-92a6-9eaa937e06bd,OpenAI/gpt-oss-20B,together_ai,path-tracing-reverse,585,3250,3835,241.013619,False,0.0,OpenAI/gpt-oss-20B,path-tracing-reverse,241.013619,False,0.0,False,241.013619 +0623dc91-fa40-4bca-977d-22980b15e100,claude-opus-4-1-20250805,anthropic,count-dataset-tokens,6848,3322,10170,279.409725,False,0.0,claude-opus-4-1-20250805,count-dataset-tokens,279.409725,False,0.0,False,279.409725 +c020c02b-6cf4-4bd0-a81b-2bcd96c01deb,deepseek-ai/DeepSeek-V3.1,together_ai,build-pmars,10132,2742,12874,424.46778,True,1.0,deepseek-ai/DeepSeek-V3.1,build-pmars,424.46778,True,1.0,True,424.46778 +84a66352-d4c9-49fd-83cd-29d0cd71a38e,OpenAI/gpt-oss-20B,together_ai,pypi-server,2036,2007,4043,243.136054,False,0.0,OpenAI/gpt-oss-20B,pypi-server,243.136054,False,0.2,False,243.136054 +455c0a68-89d0-4c39-b0f6-ca8ccaf3d0fc,claude-opus-4-1-20250805,anthropic,reverse-engineering,14637,8998,23635,746.129547,False,0.0,claude-opus-4-1-20250805,reverse-engineering,746.129547,False,0.0,False,746.129547 +c941f4df-e03f-4abf-ad88-8de43c3be3bf,OpenAI/gpt-oss-20B,together_ai,build-pov-ray,4523,1885,6408,110.50938,False,0.0,OpenAI/gpt-oss-20B,build-pov-ray,110.50938,False,0.0,False,110.50938 +a1e18589-587a-436e-bb26-1c2b2f166a92,claude-opus-4-1-20250805,anthropic,extract-elf,6343,2695,9038,495.15662,False,0.0,claude-opus-4-1-20250805,extract-elf,495.15662,False,0.8888888888888888,False,495.15662 +fab04615-c0e9-49be-83c7-677317673e0c,gpt-5-nano,openai,configure-git-webserver,7911,3995,11906,548.32542,False,0.0,gpt-5-nano,configure-git-webserver,548.32542,False,0.2,False,548.32542 +bd2ae3a3-ae0c-45d4-8537-dd0755ab7dfd,moonshotai/Kimi-K2-Instruct-0905,together_ai,db-wal-recovery,8077,4330,12407,910.921974,False,0.0,moonshotai/Kimi-K2-Instruct-0905,db-wal-recovery,910.921974,False,0.0,False,910.921974 
+55b022c0-cf29-431d-8fb3-cb8f4e791acd,gemini-2.5-flash,gemini,prove-plus-comm,3742,4402,8144,900.030109,False,0.0,gemini-2.5-flash,prove-plus-comm,900.030109,False,0.6,False,900.030109 +c4b5e27a-f695-47a5-9927-a5b079f43212,gpt-5-mini,openai,reverse-engineering,10577,18078,28655,1800.059452,False,0.0,gpt-5-mini,reverse-engineering,1800.059452,False,0.0,False,1800.059452 +0629b802-6f0c-4fbe-850d-5ddd8edda6f9,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,reshard-c4-data,11770,10648,22418,920.520015,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,reshard-c4-data,920.520015,False,0.0,False,920.520015 +0150b187-e0e9-4828-a85a-e1d6fa539f86,openai/gpt-oss-120b,together_ai,openssl-selfsigned-cert,1997,1149,3146,115.492058,True,1.0,openai/gpt-oss-120b,openssl-selfsigned-cert,115.492058,True,0.8,True,115.492058 +223908dc-2738-4e5c-a9f0-f38df2118d0e,gemini-2.5-flash,gemini,bn-fit-modify,18221,21271,39492,3620.176057,False,0.0,gemini-2.5-flash,bn-fit-modify,3620.176057,False,0.0,False,3620.176057 +70e3ed36-c854-4e7a-bb43-90fd8dc04dc5,gemini-2.5-pro,gemini,cobol-modernization,4470,2997,7467,913.022822,True,1.0,gemini-2.5-pro,cobol-modernization,913.022822,True,1.0,True,913.022822 +2d16700d-01c1-4eb9-b6fe-72fd28afbef0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,fix-code-vulnerability,13476,6341,19817,909.955602,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,fix-code-vulnerability,909.955602,False,0.0,False,909.955602 +46a6738a-f320-454b-8109-a38fc5a7b9c7,grok-code-fast-1,xai,db-wal-recovery,1853,2039,3892,255.988499,False,0.0,grok-code-fast-1,db-wal-recovery,255.988499,False,0.0,False,255.988499 +0a34123c-a794-4328-8737-19ad0a7087d4,OpenAI/gpt-oss-20B,together_ai,chess-best-move,1717,2278,3995,57.042881,False,0.0,OpenAI/gpt-oss-20B,chess-best-move,57.042881,False,0.0,False,57.042881 
+d270af73-c466-4b4f-987e-3f2fb5c5086a,gemini-2.5-pro,gemini,torch-tensor-parallelism,2248,1724,3972,91.335838,False,0.0,gemini-2.5-pro,torch-tensor-parallelism,91.335838,False,0.0,False,91.335838 +8e52bf68-bce6-402d-a94f-b0bd3feabb37,moonshotai/Kimi-K2-Instruct-0905,together_ai,dna-insert,4900,904,5804,372.595116,False,0.0,moonshotai/Kimi-K2-Instruct-0905,dna-insert,372.595116,False,0.0,False,372.595116 +135617bc-1e75-4d46-a1f7-d793a1cb25f5,claude-opus-4-1-20250805,anthropic,make-doom-for-mips,18060,5486,23546,900.024907,False,0.0,claude-opus-4-1-20250805,make-doom-for-mips,900.024907,False,0.0,False,900.024907 +818d564b-80cf-490a-8854-29094810443a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,prove-plus-comm,1548,1503,3051,235.731166,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,prove-plus-comm,235.731166,False,0.0,False,235.731166 +e14de55c-b8f0-4fb5-8f14-f1587bbb00da,gemini-2.5-flash,gemini,mteb-leaderboard,1027,646,1673,163.401351,False,0.0,gemini-2.5-flash,mteb-leaderboard,163.401351,False,0.0,False,163.401351 +a6aa06dd-bb05-4352-a9f0-f0822d4f805c,claude-sonnet-4-20250514,anthropic,merge-diff-arc-agi-task,12361,5826,18187,901.797824,False,0.0,claude-sonnet-4-20250514,merge-diff-arc-agi-task,901.797824,False,0.0,False,901.797824 +ac754c85-be90-49e7-8647-43da78db4479,gemini-2.5-pro,gemini,password-recovery,7477,3669,11146,906.229453,False,0.0,gemini-2.5-pro,password-recovery,906.229453,False,0.0,False,906.229453 +163ae01a-b148-4b4b-ace9-20b989abf67d,moonshotai/Kimi-K2-Instruct-0905,together_ai,video-processing,4226,3347,7573,256.62703,False,0.0,moonshotai/Kimi-K2-Instruct-0905,video-processing,256.62703,False,0.0,False,256.62703 +d56cf36a-2b54-4729-9e7c-aa87f9276475,claude-sonnet-4-20250514,anthropic,adaptive-rejection-sampler,12542,6251,18793,780.211017,False,0.0,claude-sonnet-4-20250514,adaptive-rejection-sampler,780.211017,False,0.0,False,780.211017 
+053f8996-cefb-46ab-9ef1-78234c2cf87c,OpenAI/gpt-oss-20B,together_ai,build-pmars,3501,11691,15192,926.337452,False,0.0,OpenAI/gpt-oss-20B,build-pmars,926.337452,False,0.0,False,926.337452 +0637f413-3133-44ff-aee1-76d8758bd7d8,grok-4-0709,xai,password-recovery,3399,1861,5260,904.304843,False,0.0,grok-4-0709,password-recovery,904.304843,False,0.0,False,904.304843 +5e803188-7216-4015-aab7-d930a2814045,moonshotai/Kimi-K2-Instruct-0905,together_ai,nginx-request-logging,6162,4336,10498,447.375746,True,1.0,moonshotai/Kimi-K2-Instruct-0905,nginx-request-logging,447.375746,True,0.4,True,447.375746 +f12084c2-0ae4-4b65-8270-751f35512c80,gpt-5,openai,git-leak-recovery,2032,1615,3647,87.398418,True,1.0,gpt-5,git-leak-recovery,87.398418,True,0.7142857142857143,True,87.398418 +2b6c5890-4caf-443f-aad0-3cf6b29704b5,grok-4-0709,xai,qemu-alpine-ssh,1772,1632,3404,361.872523,False,0.0,grok-4-0709,qemu-alpine-ssh,361.872523,False,0.0,False,361.872523 +996c40a4-da12-41f1-8249-672ed8804478,zai-org/GLM-4.5-Air-FP8,together_ai,form-filling,19226,23330,42556,520.001461,True,1.0,zai-org/GLM-4.5-Air-FP8,form-filling,520.001461,True,0.8,True,520.001461 +df04bd56-91b2-4f37-9997-3a6974ca55a5,gpt-5,openai,polyglot-c-py,1595,1520,3115,812.535531,False,0.0,gpt-5,polyglot-c-py,812.535531,False,0.0,False,812.535531 +5d1d38c7-c9f5-4b51-963c-ca8ca52dd2ec,claude-sonnet-4-20250514,anthropic,pytorch-model-cli,3487,1806,5293,900.001649,False,0.0,claude-sonnet-4-20250514,pytorch-model-cli,900.001649,False,0.4,False,900.001649 +49d55170-3b2d-4372-a4a2-022fe29bde8e,claude-opus-4-1-20250805,anthropic,sanitize-git-repo,2347,988,3335,900.000792,False,0.0,claude-opus-4-1-20250805,sanitize-git-repo,900.000792,False,0.0,False,900.000792 +461e5645-b536-46ca-ae64-54915d481555,gpt-5-nano,openai,form-filling,9603,14722,24325,900.001958,False,0.0,gpt-5-nano,form-filling,900.001958,False,0.6,False,900.001958 
+965e09ab-6dbb-473b-8e80-1c6a9d50d954,gemini-2.5-flash,gemini,build-cython-ext,27288,8068,35356,906.126771,False,0.0,gemini-2.5-flash,build-cython-ext,906.126771,False,0.0,False,906.126771 +472a6762-ce4b-493d-bc5a-b0c35d9be076,gpt-5,openai,filter-js-from-html,2498,3240,5738,390.710676,False,0.0,gpt-5,filter-js-from-html,390.710676,False,0.0,False,390.710676 +df20efba-c0d8-4e72-81b5-6b1e6f4563ca,OpenAI/gpt-oss-20B,together_ai,torch-tensor-parallelism,174,152,326,30.224706,False,0.0,OpenAI/gpt-oss-20B,torch-tensor-parallelism,30.224706,False,0.0,False,30.224706 +10c38cce-7071-45e3-986f-353c400687c3,gpt-5-nano,openai,install-windows-3.11,15388,45048,60436,3607.163798,False,0.0,gpt-5-nano,install-windows-3.11,3607.163798,False,0.0,False,3607.163798 +fc560f56-a0e3-4f94-8d24-1b0420f273e6,zai-org/GLM-4.5-Air-FP8,together_ai,build-pov-ray,1790,1718,3508,822.825175,False,0.0,zai-org/GLM-4.5-Air-FP8,build-pov-ray,822.825175,False,0.0,False,822.825175 +b3060adf-9e7a-49e8-9cdb-255d0a55824e,gpt-5-nano,openai,fix-ocaml-gc,18897,17302,36199,3605.157478,False,0.0,gpt-5-nano,fix-ocaml-gc,3605.157478,False,0.0,False,3605.157478 +9d5baf9c-d9af-4c03-b0b8-4346dcfd1977,gpt-5-mini,openai,feal-linear-cryptanalysis,23602,20973,44575,1800.055538,False,0.0,gpt-5-mini,feal-linear-cryptanalysis,1800.055538,False,0.0,False,1800.055538 +a5671ed3-abda-46b2-a381-b0c600ce9d2a,gemini-2.5-flash,gemini,openssl-selfsigned-cert,2083,2325,4408,205.537988,False,0.0,gemini-2.5-flash,openssl-selfsigned-cert,205.537988,False,0.0,False,205.537988 +ae33265f-fab8-4850-abdf-1cfcd7174cfc,gpt-5,openai,feal-linear-cryptanalysis,28504,22199,50703,1599.371244,True,1.0,gpt-5,feal-linear-cryptanalysis,1599.371244,True,1.0,True,1599.371244 +f1af89f2-a910-427c-9636-b47e1804994a,claude-opus-4-1-20250805,anthropic,reshard-c4-data,7844,13944,21788,1729.501661,False,0.0,claude-opus-4-1-20250805,reshard-c4-data,1729.501661,False,0.0,False,1729.501661 
+0335783f-744b-44be-b8ad-9a0ff983e200,gemini-2.5-pro,gemini,distribution-search,5752,6471,12223,356.706715,False,0.0,gemini-2.5-pro,distribution-search,356.706715,False,0.6,False,356.706715 +95140eb3-87a4-43f4-b332-e72e7853bee7,gpt-5-nano,openai,cobol-modernization,13207,12943,26150,901.324885,False,0.0,gpt-5-nano,cobol-modernization,901.324885,False,0.4,False,901.324885 +429e99de-f645-44c4-bb74-feded6c11639,grok-code-fast-1,xai,filter-js-from-html,1200,615,1815,32.701211,False,0.0,grok-code-fast-1,filter-js-from-html,32.701211,False,0.0,False,32.701211 +68f8aa93-d7fa-4ae9-b791-5d420f3cd223,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,tune-mjcf,13262,7597,20859,907.127844,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,tune-mjcf,907.127844,False,0.0,False,907.127844 +bf977a62-01be-461b-8f59-a89b02628300,deepseek-ai/DeepSeek-V3.1,together_ai,fix-code-vulnerability,12891,5737,18628,572.617767,False,0.0,deepseek-ai/DeepSeek-V3.1,fix-code-vulnerability,572.617767,False,0.2,False,572.617767 +801a87e7-f9c7-40ff-affc-9c5b7b800f46,grok-4-0709,xai,openssl-selfsigned-cert,2082,1268,3350,242.801096,False,0.0,grok-4-0709,openssl-selfsigned-cert,242.801096,False,0.0,False,242.801096 +638a5d66-5dc4-4ba6-828a-123a901983c1,claude-opus-4-1-20250805,anthropic,db-wal-recovery,7537,6415,13952,254.539664,False,0.0,claude-opus-4-1-20250805,db-wal-recovery,254.539664,False,0.0,False,254.539664 +5542b648-ca61-4a74-a236-8d32a5aeff5c,gpt-5-nano,openai,torch-tensor-parallelism,16328,11106,27434,908.130843,False,0.0,gpt-5-nano,torch-tensor-parallelism,908.130843,False,0.0,False,908.130843 +fde7b665-7e20-40ea-9bcd-076e730aa57e,moonshotai/Kimi-K2-Instruct-0905,together_ai,code-from-image,15573,9305,24878,420.224504,False,0.0,moonshotai/Kimi-K2-Instruct-0905,code-from-image,420.224504,False,0.6,False,420.224504 
+3b215da4-7131-43c4-a290-8a206faa1157,gemini-2.5-flash,gemini,regex-log,1380,697,2077,119.21774,True,1.0,gemini-2.5-flash,regex-log,119.21774,True,0.8,True,119.21774 +a9856963-833a-419b-8668-85e9e45c1175,moonshotai/Kimi-K2-Instruct-0905,together_ai,schemelike-metacircular-eval,21100,18460,39560,2406.577526,False,0.0,moonshotai/Kimi-K2-Instruct-0905,schemelike-metacircular-eval,2406.577526,False,0.0,False,2406.577526 +fc0a5e9f-368d-4891-a92e-05b6193c4e66,claude-sonnet-4-20250514,anthropic,adaptive-rejection-sampler,12385,10203,22588,906.989604,False,0.0,claude-sonnet-4-20250514,adaptive-rejection-sampler,906.989604,False,0.0,False,906.989604 +3c64f610-4a83-4697-8959-81374b14295c,openai/gpt-oss-120b,together_ai,prove-plus-comm,1872,1055,2927,192.563146,True,1.0,openai/gpt-oss-120b,prove-plus-comm,192.563146,True,1.0,True,192.563146 +092dccba-32eb-491d-b1df-db315b885144,gpt-5-mini,openai,build-pmars,7665,8101,15766,921.000067,False,0.0,gpt-5-mini,build-pmars,921.000067,False,0.2,False,921.000067 +b75addfe-e049-4cad-85b7-3c8cbff30918,grok-4-0709,xai,winning-avg-corewars,14562,19536,34098,3617.640234,False,0.0,grok-4-0709,winning-avg-corewars,3617.640234,False,0.0,False,3617.640234 +0c744cfe-aed4-4812-81b3-9f00ffdae064,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,largest-eigenval,6702,6072,12774,905.013828,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,largest-eigenval,905.013828,False,0.2,False,905.013828 +ea9fd1bb-f02d-4638-a0df-dd7b6012b96d,zai-org/GLM-4.5-Air-FP8,together_ai,sqlite-db-truncate,4260,5366,9626,485.715557,False,0.0,zai-org/GLM-4.5-Air-FP8,sqlite-db-truncate,485.715557,False,0.0,False,485.715557 +6b73e5ba-8a2c-4ee2-984e-1dd88b92edd1,gpt-5-nano,openai,model-extraction-relu-logits,1511,1166,2677,136.355575,False,0.0,gpt-5-nano,model-extraction-relu-logits,136.355575,False,0.0,False,136.355575 
+85aa4dc2-4b65-4ed9-9b1b-060c97b3d881,grok-4-0709,xai,filter-js-from-html,1253,640,1893,266.375329,False,0.0,grok-4-0709,filter-js-from-html,266.375329,False,0.0,False,266.375329 +593b8ae4-9f1b-4e34-8253-0976e2f6db97,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,db-wal-recovery,2294,1657,3951,62.129188,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,db-wal-recovery,62.129188,False,0.0,False,62.129188 +52831039-8329-4868-b3f9-9b87fe32e787,gpt-5-mini,openai,wasm-pipeline,8578,7334,15912,474.52876,True,1.0,gpt-5-mini,wasm-pipeline,474.52876,True,0.6,True,474.52876 +512780bd-2799-47af-9c82-8aad4a47f567,OpenAI/gpt-oss-20B,together_ai,cobol-modernization,1412,2698,4110,211.925308,False,0.0,OpenAI/gpt-oss-20B,cobol-modernization,211.925308,False,0.0,False,211.925308 +41ada0fb-49c6-4f19-aa0f-114e211b4bab,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,make-doom-for-mips,19645,9960,29605,901.00345,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,make-doom-for-mips,901.00345,False,0.0,False,901.00345 +1fbd249c-4d0d-4973-b580-82522aaf5e7c,grok-4-0709,xai,torch-tensor-parallelism,1075,1583,2658,812.482565,False,0.0,grok-4-0709,torch-tensor-parallelism,812.482565,False,0.0,False,812.482565 +b6438a72-dbf2-409a-8095-03cd4feb0650,claude-opus-4-1-20250805,anthropic,build-pov-ray,16243,5103,21346,3200.760685,True,1.0,claude-opus-4-1-20250805,build-pov-ray,3200.760685,True,0.75,True,3200.760685 +10643166-85aa-4dfa-b28a-585ec4ba4ce7,openai/gpt-oss-120b,together_ai,form-filling,3538,1690,5228,60.202199,False,0.0,openai/gpt-oss-120b,form-filling,60.202199,False,0.6,False,60.202199 +2cacddc9-541f-486d-bbf7-d2e3e9a14136,claude-sonnet-4-20250514,anthropic,build-cython-ext,10717,2743,13460,954.120021,False,0.0,claude-sonnet-4-20250514,build-cython-ext,954.120021,False,0.0,False,954.120021 
+0c465521-c4c7-4803-ab13-d77a9d9f8e23,claude-opus-4-1-20250805,anthropic,form-filling,16489,14403,30892,700.345711,True,1.0,claude-opus-4-1-20250805,form-filling,700.345711,True,1.0,True,700.345711 +dd0fca22-7153-4e63-8d9a-34a2eebe54bb,gpt-5-mini,openai,cancel-async-tasks,1836,1251,3087,80.501672,True,1.0,gpt-5-mini,cancel-async-tasks,80.501672,True,0.4,True,80.501672 +1dc5f35b-3e1f-474d-bd59-4d5ef6928bbc,grok-code-fast-1,xai,extract-elf,6277,4328,10605,340.772261,False,0.0,grok-code-fast-1,extract-elf,340.772261,False,0.6,False,340.772261 +8db551d9-2c26-4240-9690-62caf946da55,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,port-compressor,56852,33147,89999,3631.215361,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,port-compressor,3631.215361,False,0.0,False,3631.215361 +1354cfe7-e4c7-4885-ac40-12d8b56e40be,moonshotai/Kimi-K2-Instruct-0905,together_ai,git-leak-recovery,2563,2366,4929,241.844258,True,1.0,moonshotai/Kimi-K2-Instruct-0905,git-leak-recovery,241.844258,True,1.0,True,241.844258 +b17d3a4f-8dd6-4be9-8994-8c94e7baea62,grok-code-fast-1,xai,cancel-async-tasks,1198,667,1865,50.394023,False,0.0,grok-code-fast-1,cancel-async-tasks,50.394023,False,0.2,False,50.394023 +45fb63d0-b46d-4509-96d1-d546be30b372,claude-opus-4-1-20250805,anthropic,mteb-retrieve,2158,1411,3569,81.147327,False,0.0,claude-opus-4-1-20250805,mteb-retrieve,81.147327,False,0.0,False,81.147327 +651239f2-6eae-42f9-9d5a-6c3a0e804e4b,deepseek-ai/DeepSeek-V3.1,together_ai,sqlite-with-gcov,9402,1484,10886,410.989663,True,1.0,deepseek-ai/DeepSeek-V3.1,sqlite-with-gcov,410.989663,True,0.8,True,410.989663 +98af9e50-52ee-4dbf-8410-e153ac044635,zai-org/GLM-4.5-Air-FP8,together_ai,openssl-selfsigned-cert,2045,1757,3802,57.877799,False,0.0,zai-org/GLM-4.5-Air-FP8,openssl-selfsigned-cert,57.877799,False,0.0,False,57.877799 
+d0f3aada-4fde-403b-8b42-d3f7ffa51204,deepseek-ai/DeepSeek-V3.1,together_ai,cobol-modernization,8269,6094,14363,774.324846,False,0.0,deepseek-ai/DeepSeek-V3.1,cobol-modernization,774.324846,False,0.6,False,774.324846 +e3191908-bc63-4d5d-8db9-1995d863ef37,claude-sonnet-4-20250514,anthropic,wasm-pipeline,9862,5637,15499,474.62786,False,0.0,claude-sonnet-4-20250514,wasm-pipeline,474.62786,False,0.6,False,474.62786 +1f1d6ef1-be2e-4ef5-907f-c13ab80724c4,claude-opus-4-1-20250805,anthropic,code-from-image,1986,952,2938,1971.751474,False,0.0,claude-opus-4-1-20250805,code-from-image,1971.751474,False,0.125,False,1971.751474 +69f0f0fd-0164-4323-8bd5-703646feffe9,grok-4-0709,xai,crack-7z-hash,8392,2929,11321,524.937764,True,1.0,grok-4-0709,crack-7z-hash,524.937764,True,0.8,True,524.937764 +5c608902-1e53-4c3f-a80a-748d8db22af9,deepseek-ai/DeepSeek-V3.1,together_ai,schemelike-metacircular-eval,36382,37041,73423,2320.406535,False,0.0,deepseek-ai/DeepSeek-V3.1,schemelike-metacircular-eval,2320.406535,False,0.0,False,2320.406535 +6d885e3b-9105-4172-8976-aeeae03ed579,zai-org/GLM-4.5-Air-FP8,together_ai,mteb-retrieve,6375,3641,10016,420.028343,False,0.0,zai-org/GLM-4.5-Air-FP8,mteb-retrieve,420.028343,False,0.0,False,420.028343 +3bb03f30-e18b-4f4f-a320-aac0d1896623,OpenAI/gpt-oss-20B,together_ai,build-initramfs-qemu,1458,986,2444,49.997346,False,0.0,OpenAI/gpt-oss-20B,build-initramfs-qemu,49.997346,False,0.0,False,49.997346 +4e3b12d9-097a-41cc-9cb9-76841944c92c,grok-4-0709,xai,make-doom-for-mips,19171,3292,22463,610.240123,False,0.0,grok-4-0709,make-doom-for-mips,610.240123,False,0.0,False,610.240123 +ee4d7c74-c247-4ff3-9e0d-8cadcfe5fa99,gpt-5-nano,openai,make-doom-for-mips,10829,5731,16560,912.645415,False,0.0,gpt-5-nano,make-doom-for-mips,912.645415,False,0.0,False,912.645415 +65350c5b-6ca5-4310-b638-dfed4526d13b,openai/gpt-oss-120b,together_ai,circuit-fibsqrt,7229,5979,13208,706.457559,False,0.0,openai/gpt-oss-120b,circuit-fibsqrt,706.457559,False,0.0,False,706.457559 
+69974c12-9460-4e5c-976a-bcf1cdba8684,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,pytorch-model-recovery,19917,6218,26135,904.304517,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,pytorch-model-recovery,904.304517,False,0.0,False,904.304517 +a84d82d0-060b-4cfc-98bb-a36b1399d47a,grok-code-fast-1,xai,sqlite-with-gcov,1161,830,1991,159.549124,False,0.0,grok-code-fast-1,sqlite-with-gcov,159.549124,False,0.2,False,159.549124 +ebfa2537-798b-4756-b92b-bb9b40642e94,moonshotai/Kimi-K2-Instruct-0905,together_ai,constraints-scheduling,7877,6252,14129,601.522393,True,1.0,moonshotai/Kimi-K2-Instruct-0905,constraints-scheduling,601.522393,True,0.6,True,601.522393 +bf0a7563-be09-460b-b693-c4d97dc2de75,gpt-5,openai,mteb-retrieve,2017,1054,3071,215.725581,False,0.0,gpt-5,mteb-retrieve,215.725581,False,0.0,False,215.725581 +b8b258dd-b1e0-459d-af32-020af83bf977,gemini-2.5-pro,gemini,sqlite-with-gcov,8133,1667,9800,319.10009,False,0.0,gemini-2.5-pro,sqlite-with-gcov,319.10009,False,0.8,False,319.10009 +6d87c5d4-8d86-41e8-96ce-8eb2e6f9856e,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,extract-elf,11624,5975,17599,739.631058,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,extract-elf,739.631058,False,0.6,False,739.631058 +061275aa-d075-4b06-a631-2beb561da44b,deepseek-ai/DeepSeek-V3.1,together_ai,password-recovery,12919,7337,20256,915.1463,False,0.0,deepseek-ai/DeepSeek-V3.1,password-recovery,915.1463,False,0.0,False,915.1463 +e8566611-72b9-42d3-abc8-c97a9e87451a,gemini-2.5-flash,gemini,chess-best-move,16207,17352,33559,900.511685,False,0.0,gemini-2.5-flash,chess-best-move,900.511685,False,0.0,False,900.511685 +3742f7fd-53b0-4929-8c19-9f94b828f836,grok-4-0709,xai,qemu-startup,1951,2764,4715,916.980591,False,0.0,grok-4-0709,qemu-startup,916.980591,False,0.4,False,916.980591 
+3f6bff5b-608c-4ef4-8f5b-701c1eacc719,gemini-2.5-flash,gemini,install-windows-3.11,2778,2876,5654,254.501894,False,0.0,gemini-2.5-flash,install-windows-3.11,254.501894,False,0.0,False,254.501894 +9030fee1-e03c-412e-a189-a1021b294bfc,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sparql-university,1515,782,2297,102.630775,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sparql-university,102.630775,False,0.0,False,102.630775 +8d45bd04-bc18-4ce0-af7f-c9c8446aaeba,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,reverse-engineering,4274,3221,7495,503.58089,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,reverse-engineering,503.58089,False,0.0,False,503.58089 +210864df-ec02-4e28-bfec-cc844c5994fc,zai-org/GLM-4.5-Air-FP8,together_ai,chess-best-move,17965,8324,26289,728.487402,False,0.0,zai-org/GLM-4.5-Air-FP8,chess-best-move,728.487402,False,0.0,False,728.487402 +9c5e1511-769a-46ef-bdf9-e99f40d6af62,gemini-2.5-flash,gemini,write-compressor,4168,3777,7945,825.210902,False,0.0,gemini-2.5-flash,write-compressor,825.210902,False,0.0,False,825.210902 +750995cc-8759-4aea-a1c7-08a418cde7f7,claude-opus-4-1-20250805,anthropic,regex-log,4050,4283,8333,156.21718,True,1.0,claude-opus-4-1-20250805,regex-log,156.21718,True,0.5714285714285714,True,156.21718 +40e7bb68-125a-4b22-818a-99f6f388619c,moonshotai/Kimi-K2-Instruct-0905,together_ai,count-dataset-tokens,15218,5577,20795,850.509198,True,1.0,moonshotai/Kimi-K2-Instruct-0905,count-dataset-tokens,850.509198,True,0.2,True,850.509198 +4b17eecb-0f5f-405a-87a8-d3d9f5d254ed,gemini-2.5-flash,gemini,distribution-search,42805,50967,93772,3603.911274,False,0.0,gemini-2.5-flash,distribution-search,3603.911274,False,0.0,False,3603.911274 +70fdd6cf-e4da-4bbb-968c-92675bbbcd99,zai-org/GLM-4.5-Air-FP8,together_ai,hf-model-inference,5109,4324,9433,363.338164,True,1.0,zai-org/GLM-4.5-Air-FP8,hf-model-inference,363.338164,True,0.8,True,363.338164 
+bf7cee47-a4d6-4b73-9a3b-fb9c6a3d64f7,gemini-2.5-pro,gemini,install-windows-3.11,31000,11432,42432,3644.88457,False,0.0,gemini-2.5-pro,install-windows-3.11,3644.88457,False,0.0,False,3644.88457 +afaac7c3-cb40-4ff3-a4bd-3ba920347e6c,gemini-2.5-pro,gemini,mteb-leaderboard,2847,1853,4700,400.520879,False,0.0,gemini-2.5-pro,mteb-leaderboard,400.520879,False,0.0,False,400.520879 +696475cc-0591-4ef0-8b6f-21b644a9277a,gpt-5-mini,openai,vulnerable-secret,12246,5326,17572,446.983423,True,1.0,gpt-5-mini,vulnerable-secret,446.983423,True,0.4,True,446.983423 +979d7f90-e29a-4f5f-ae4f-4388beb6dcad,grok-code-fast-1,xai,mteb-retrieve,1978,981,2959,52.264941,False,0.0,grok-code-fast-1,mteb-retrieve,52.264941,False,0.0,False,52.264941 +a11648c9-06fc-4c98-b81f-04eb1403f241,gemini-2.5-flash,gemini,run-pdp11-code,6659,7175,13834,199.612664,False,0.0,gemini-2.5-flash,run-pdp11-code,199.612664,False,0.0,False,199.612664 +7fe3e457-630a-41b7-b9c7-d07b66991bf0,gemini-2.5-pro,gemini,polyglot-rust-c,1847,2656,4503,544.45041,False,0.0,gemini-2.5-pro,polyglot-rust-c,544.45041,False,0.0,False,544.45041 +b3329310-2870-4d7c-993f-e1aafe12dd8e,claude-sonnet-4-20250514,anthropic,qemu-startup,5711,7536,13247,909.511829,False,0.0,claude-sonnet-4-20250514,qemu-startup,909.511829,False,0.4,False,909.511829 +db525db7-157f-49e2-bf25-739f60dc2e52,gpt-5-mini,openai,make-mips-interpreter,26199,31822,58021,1800.005615,False,0.0,gpt-5-mini,make-mips-interpreter,1800.005615,False,0.0,False,1800.005615 +00dab5a2-1493-4eaa-ac3a-1753dc0afc40,gemini-2.5-flash,gemini,prove-plus-comm,1315,1081,2396,195.506131,False,0.0,gemini-2.5-flash,prove-plus-comm,195.506131,False,0.6,False,195.506131 +0e56eaff-4316-4999-b939-3bcb50d11950,deepseek-ai/DeepSeek-V3.1,together_ai,filter-js-from-html,2859,2048,4907,277.571057,False,0.0,deepseek-ai/DeepSeek-V3.1,filter-js-from-html,277.571057,False,0.0,False,277.571057 
+6a0230e5-b755-439c-845e-c652bf805aeb,deepseek-ai/DeepSeek-V3.1,together_ai,mteb-leaderboard,1538,1253,2791,100.276781,False,0.0,deepseek-ai/DeepSeek-V3.1,mteb-leaderboard,100.276781,False,0.0,False,100.276781 +fe450c50-fa93-43fa-a7f6-5063274306f1,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,regex-log,1434,733,2167,46.768913,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,regex-log,46.768913,False,0.0,False,46.768913 +3cde7713-8499-4c45-aa48-2929cd9c6b49,claude-sonnet-4-20250514,anthropic,sqlite-db-truncate,5941,3960,9901,279.11761,False,0.0,claude-sonnet-4-20250514,sqlite-db-truncate,279.11761,False,0.0,False,279.11761 +c852d816-d4fd-432f-b502-aae29519c613,moonshotai/Kimi-K2-Instruct-0905,together_ai,cobol-modernization,16910,16564,33474,914.722451,True,1.0,moonshotai/Kimi-K2-Instruct-0905,cobol-modernization,914.722451,True,0.6,True,914.722451 +cfed86a5-f3cd-43a6-9098-4cb5001731bd,gemini-2.5-flash,gemini,circuit-fibsqrt,32580,139155,171735,3600.086186,False,0.0,gemini-2.5-flash,circuit-fibsqrt,3600.086186,False,0.0,False,3600.086186 +283be447-df8c-433e-b586-e5c41031ab99,claude-sonnet-4-20250514,anthropic,pypi-server,2003,1574,3577,1013.456787,False,0.0,claude-sonnet-4-20250514,pypi-server,1013.456787,False,0.8,False,1013.456787 +5e080ce5-9c64-4547-965d-d696d130cdff,gpt-5-nano,openai,fix-code-vulnerability,12079,6329,18408,482.756827,True,1.0,gpt-5-nano,fix-code-vulnerability,482.756827,True,0.2,True,482.756827 +f050894e-2717-4831-9cd8-09d9d7fcf54b,gemini-2.5-flash,gemini,make-mips-interpreter,28943,73214,102157,2074.266498,False,0.0,gemini-2.5-flash,make-mips-interpreter,2074.266498,False,0.0,False,2074.266498 +6ac99586-2b2a-4998-aa9a-efb2375a54ce,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,git-leak-recovery,2245,1796,4041,290.474758,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,git-leak-recovery,290.474758,True,1.0,True,290.474758 
+ca4278e7-3cea-411a-86cb-bac0d3ade1d9,gemini-2.5-pro,gemini,polyglot-c-py,1531,1762,3293,346.035359,False,0.0,gemini-2.5-pro,polyglot-c-py,346.035359,False,0.2,False,346.035359 +22d41929-c806-4483-9e54-00b739095465,grok-code-fast-1,xai,wasm-pipeline,5852,2047,7899,223.040669,False,0.0,grok-code-fast-1,wasm-pipeline,223.040669,False,0.2,False,223.040669 +b786acb0-2081-4b74-9fa4-9e996d8700a5,claude-opus-4-1-20250805,anthropic,reshard-c4-data,12415,7050,19465,294.257391,False,0.0,claude-opus-4-1-20250805,reshard-c4-data,294.257391,False,0.0,False,294.257391 +92f03e5e-f64d-4837-ba30-bdeff5bcc39f,grok-4-0709,xai,large-scale-text-editing,2421,1482,3903,631.20016,True,1.0,grok-4-0709,large-scale-text-editing,631.20016,True,0.4,True,631.20016 +1c1e07c9-754b-4a7f-8f06-9ee94e507748,claude-opus-4-1-20250805,anthropic,financial-document-processor,9941,3801,13742,193.840313,False,0.0,claude-opus-4-1-20250805,financial-document-processor,193.840313,False,0.0,False,193.840313 +cfd19a89-1abe-4c5c-9012-cabfa936a0b4,OpenAI/gpt-oss-20B,together_ai,financial-document-processor,1122,2297,3419,99.55459,False,0.0,OpenAI/gpt-oss-20B,financial-document-processor,99.55459,False,0.0,False,99.55459 +835a120d-c9f8-4aae-b3f5-4782d58e004c,gpt-5-nano,openai,sparql-university,10754,9978,20732,923.192472,False,0.0,gpt-5-nano,sparql-university,923.192472,False,0.0,False,923.192472 +741cef4b-4f50-4cc5-8c41-9c2ea1e0ba65,grok-4-0709,xai,polyglot-c-py,1655,955,2610,280.463774,True,1.0,grok-4-0709,polyglot-c-py,280.463774,True,0.6,True,280.463774 +55abd204-1219-4a73-9d7f-63981a2c1251,moonshotai/Kimi-K2-Instruct-0905,together_ai,hf-model-inference,7027,5925,12952,686.606258,False,0.0,moonshotai/Kimi-K2-Instruct-0905,hf-model-inference,686.606258,False,0.0,False,686.606258 +432ad616-576f-48b7-b8fc-82fef748ffa1,openai/gpt-oss-120b,together_ai,run-pdp11-code,2157,2258,4415,1095.415645,False,0.0,openai/gpt-oss-120b,run-pdp11-code,1095.415645,False,0.0,False,1095.415645 
+99adc89e-1af6-42ec-97ca-16e808ff80f5,gemini-2.5-flash,gemini,prove-plus-comm,2847,2902,5749,307.628228,True,1.0,gemini-2.5-flash,prove-plus-comm,307.628228,True,0.6,True,307.628228 +0d593502-a027-415c-bfc6-71412ce4999a,claude-sonnet-4-20250514,anthropic,fix-ocaml-gc,25645,9395,35040,3837.073705,False,0.0,claude-sonnet-4-20250514,fix-ocaml-gc,3837.073705,False,0.0,False,3837.073705 +de9ae622-be1b-427e-8956-ec9391d0dff9,gemini-2.5-flash,gemini,pypi-server,4121,1573,5694,122.966065,False,0.0,gemini-2.5-flash,pypi-server,122.966065,False,0.0,False,122.966065 +2affbd25-6505-4fa8-8919-0d29c8e0ceb7,claude-opus-4-1-20250805,anthropic,distribution-search,5983,4813,10796,256.920603,True,1.0,claude-opus-4-1-20250805,distribution-search,256.920603,True,0.5555555555555556,True,256.920603 +438136c8-3469-43f7-8342-8d2d3fbadce4,gemini-2.5-pro,gemini,code-from-image,8963,1843,10806,194.843998,True,1.0,gemini-2.5-pro,code-from-image,194.843998,True,1.0,True,194.843998 +395723e2-c50c-4bdb-8a94-d0353f337d4e,openai/gpt-oss-120b,together_ai,fix-git,8155,4045,12200,905.16125,False,0.0,openai/gpt-oss-120b,fix-git,905.16125,False,0.6,False,905.16125 +b0949005-d326-4368-bb29-5a4d5498bd7d,gpt-5-nano,openai,sparql-university,3281,1311,4592,103.284168,False,0.0,gpt-5-nano,sparql-university,103.284168,False,0.0,False,103.284168 +81384866-4394-4f78-a506-af497faf7496,gpt-5,openai,filter-js-from-html,2586,2766,5352,296.645272,False,0.0,gpt-5,filter-js-from-html,296.645272,False,0.0,False,296.645272 +6880c3c6-dc10-4fa4-89a1-15bb36475bc2,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,tune-mjcf,9170,9144,18314,926.405488,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,tune-mjcf,926.405488,False,0.0,False,926.405488 +f5dae9b2-744e-4e6c-a873-872b5acbf278,grok-4-0709,xai,adaptive-rejection-sampler,7825,3119,10944,906.756728,False,0.0,grok-4-0709,adaptive-rejection-sampler,906.756728,False,0.0,False,906.756728 
+73b8911b-f3d3-454f-a837-e3453ea2078d,zai-org/GLM-4.5-Air-FP8,together_ai,large-scale-text-editing,3796,6134,9930,1200.820858,False,0.0,zai-org/GLM-4.5-Air-FP8,large-scale-text-editing,1200.820858,False,0.0,False,1200.820858 +605dbc0e-1ad7-4eae-908c-c88d4ed19720,claude-sonnet-4-20250514,anthropic,feal-linear-cryptanalysis,20039,18964,39003,1800.68162,False,0.0,claude-sonnet-4-20250514,feal-linear-cryptanalysis,1800.68162,False,0.0,False,1800.68162 +adc1a977-1904-489f-bc6c-17e19fc5abe5,grok-4-0709,xai,mteb-leaderboard,925,408,1333,155.60713,False,0.0,grok-4-0709,mteb-leaderboard,155.60713,False,0.0,False,155.60713 +0549246a-7425-4526-8c38-60f97574c8d9,zai-org/GLM-4.5-Air-FP8,together_ai,train-fasttext,16553,5982,22535,3605.987934,False,0.0,zai-org/GLM-4.5-Air-FP8,train-fasttext,3605.987934,False,0.2,False,3605.987934 +bd7138f8-a29d-4a6a-83aa-dd9c2f4137e1,gemini-2.5-flash,gemini,train-fasttext,16952,8382,25334,3602.629325,False,0.0,gemini-2.5-flash,train-fasttext,3602.629325,False,0.0,False,3602.629325 +b376b093-070b-4b0f-bf81-05d08cac6d49,claude-opus-4-1-20250805,anthropic,make-mips-interpreter,36656,30020,66676,1815.706967,False,0.0,claude-opus-4-1-20250805,make-mips-interpreter,1815.706967,False,0.0,False,1815.706967 +9bd3fbac-ab22-40f5-8afc-def6c2749c08,grok-code-fast-1,xai,model-extraction-relu-logits,1286,737,2023,174.07949,False,0.0,grok-code-fast-1,model-extraction-relu-logits,174.07949,False,0.0,False,174.07949 +e9eb0c87-6b8c-43df-8784-3b95411ad258,claude-opus-4-1-20250805,anthropic,large-scale-text-editing,5753,6940,12693,872.432357,False,0.0,claude-opus-4-1-20250805,large-scale-text-editing,872.432357,False,0.6666666666666666,False,872.432357 +4455e51e-5067-490f-aa31-7f835f910562,grok-4-0709,xai,merge-diff-arc-agi-task,5475,1461,6936,907.250697,False,0.0,grok-4-0709,merge-diff-arc-agi-task,907.250697,False,0.4,False,907.250697 
+d6b43375-583f-41ed-be41-3c2ab2f4c6f5,gemini-2.5-pro,gemini,build-initramfs-qemu,5504,2963,8467,595.349904,False,0.0,gemini-2.5-pro,build-initramfs-qemu,595.349904,False,0.0,False,595.349904 +4856feea-0627-412f-862b-7dc26e068df6,gemini-2.5-pro,gemini,build-pov-ray,22166,7302,29468,2019.230885,True,1.0,gemini-2.5-pro,build-pov-ray,2019.230885,True,1.0,True,2019.230885 +2a7c987c-604b-4e93-a45d-9e44554555bd,claude-sonnet-4-20250514,anthropic,reshard-c4-data,7076,5794,12870,451.346809,False,0.0,claude-sonnet-4-20250514,reshard-c4-data,451.346809,False,0.0,False,451.346809 +dc8ff2d4-6f90-481a-870c-b4a6879ef177,gemini-2.5-pro,gemini,hf-model-inference,4170,1664,5834,298.582968,True,1.0,gemini-2.5-pro,hf-model-inference,298.582968,True,0.8,True,298.582968 +56292ed4-7a0f-4cc3-b7bf-7df32bdee0f1,claude-opus-4-1-20250805,anthropic,nginx-request-logging,4659,2125,6784,113.874251,True,1.0,claude-opus-4-1-20250805,nginx-request-logging,113.874251,True,1.0,True,113.874251 +dea1b982-98d8-4ad7-87b9-56a13f6dfb08,gpt-5,openai,install-windows-3.11,4958,1660,6618,227.360665,False,0.0,gpt-5,install-windows-3.11,227.360665,False,0.0,False,227.360665 +7ae7750e-4596-4b03-991b-a81632e6236f,grok-code-fast-1,xai,qemu-alpine-ssh,1439,3500,4939,613.068757,False,0.0,grok-code-fast-1,qemu-alpine-ssh,613.068757,False,0.0,False,613.068757 +a8d8de43-7c71-4506-a1b0-3bcb214dbbc4,OpenAI/gpt-oss-20B,together_ai,code-from-image,272,788,1060,30.53173,False,0.0,OpenAI/gpt-oss-20B,code-from-image,30.53173,False,0.0,False,30.53173 +5a9a9bc2-f373-4173-aa58-215555f92725,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-initramfs-qemu,28015,8949,36964,902.984272,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-initramfs-qemu,902.984272,False,0.0,False,902.984272 +cfd431b1-27ad-4425-9d64-2a9bf2fe1dd7,gpt-5-nano,openai,large-scale-text-editing,6731,6254,12985,1202.879457,False,0.0,gpt-5-nano,large-scale-text-editing,1202.879457,False,0.0,False,1202.879457 
+5c3ba37e-1a50-43fb-a46f-424b10803bc6,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-pov-ray,15372,9929,25301,1993.775304,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-pov-ray,1993.775304,False,0.2,False,1993.775304 +de079411-a6b5-4929-ab67-eb1cd8cf93b7,moonshotai/Kimi-K2-Instruct-0905,together_ai,winning-avg-corewars,21041,25269,46310,2882.272548,False,0.0,moonshotai/Kimi-K2-Instruct-0905,winning-avg-corewars,2882.272548,False,0.0,False,2882.272548 +0395eb15-b3bd-4af3-b376-9966e50c71f2,openai/gpt-oss-120b,together_ai,extract-elf,1842,1563,3405,102.883306,False,0.0,openai/gpt-oss-120b,extract-elf,102.883306,False,0.4,False,102.883306 +8f7f5dec-c11c-4fe9-a8e4-37d36ca0e51a,claude-opus-4-1-20250805,anthropic,torch-tensor-parallelism,4677,3598,8275,801.718159,False,0.0,claude-opus-4-1-20250805,torch-tensor-parallelism,801.718159,False,0.0,False,801.718159 +c8adcce5-e091-4495-a5df-1078aa0d4142,gpt-5-mini,openai,prove-plus-comm,1477,898,2375,172.618389,False,0.0,gpt-5-mini,prove-plus-comm,172.618389,False,0.6,False,172.618389 +48d930a6-c9db-436f-9676-5908dd4cb973,claude-opus-4-1-20250805,anthropic,chess-best-move,7235,5569,12804,389.608364,False,0.0,claude-opus-4-1-20250805,chess-best-move,389.608364,False,0.0,False,389.608364 +3ef19d39-df32-499c-a71c-2ee8e6e194f9,gpt-5-nano,openai,build-cython-ext,11200,4620,15820,911.589764,False,0.0,gpt-5-nano,build-cython-ext,911.589764,False,0.0,False,911.589764 +9ce94d87-efc2-4f01-8025-e6089d5857c6,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,cancel-async-tasks,8419,7334,15753,766.124338,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,cancel-async-tasks,766.124338,False,0.6,False,766.124338 +d62fa252-d44c-4462-9afd-6b12751c39f1,claude-opus-4-1-20250805,anthropic,tune-mjcf,5443,3965,9408,245.90741,True,1.0,claude-opus-4-1-20250805,tune-mjcf,245.90741,True,0.25,True,245.90741 
+26094bb4-1976-4d2d-b45c-b91dcc088929,openai/gpt-oss-120b,together_ai,run-pdp11-code,3639,2503,6142,275.998361,False,0.0,openai/gpt-oss-120b,run-pdp11-code,275.998361,False,0.0,False,275.998361 +d1c33182-4f99-4162-9ac4-2694a2e36faf,OpenAI/gpt-oss-20B,together_ai,pypi-server,6757,14371,21128,494.924042,False,0.0,OpenAI/gpt-oss-20B,pypi-server,494.924042,False,0.2,False,494.924042 +536aeaca-c74a-4305-8323-bc75ad04e2d5,grok-4-0709,xai,code-from-image,7164,5170,12334,1200.045356,False,0.0,grok-4-0709,code-from-image,1200.045356,False,0.0,False,1200.045356 +aa3d5da6-d0f9-4282-98fb-85558f318e93,grok-code-fast-1,xai,sqlite-db-truncate,1827,1912,3739,206.492458,False,0.0,grok-code-fast-1,sqlite-db-truncate,206.492458,False,0.0,False,206.492458 +a35c3618-39e1-4a3e-a414-4e8c4336b4d4,grok-4-0709,xai,dna-insert,964,242,1206,434.963809,False,0.0,grok-4-0709,dna-insert,434.963809,False,0.0,False,434.963809 +47376a96-6e41-4876-b0ae-f7cd1f84e43d,claude-opus-4-1-20250805,anthropic,sqlite-with-gcov,9379,1806,11185,221.163788,True,1.0,claude-opus-4-1-20250805,sqlite-with-gcov,221.163788,True,0.5714285714285714,True,221.163788 +72ff3a25-d182-4c34-a2dd-ae5a9b8d765c,openai/gpt-oss-120b,together_ai,sqlite-with-gcov,1221,952,2173,373.045597,True,1.0,openai/gpt-oss-120b,sqlite-with-gcov,373.045597,True,0.8,True,373.045597 +05aa6231-d140-4980-9f9a-48de61adf1c7,gemini-2.5-pro,gemini,chess-best-move,10040,2358,12398,658.742946,False,0.0,gemini-2.5-pro,chess-best-move,658.742946,False,0.0,False,658.742946 +5f7e7074-edc2-48c1-b771-572113e7a02b,OpenAI/gpt-oss-20B,together_ai,count-dataset-tokens,4132,11335,15467,904.826627,False,0.0,OpenAI/gpt-oss-20B,count-dataset-tokens,904.826627,False,0.0,False,904.826627 +48f6b31b-e463-4816-8d8e-1aa58eb9cc92,gpt-5-mini,openai,cobol-modernization,6709,4440,11149,262.038942,True,1.0,gpt-5-mini,cobol-modernization,262.038942,True,1.0,True,262.038942 
+15b7bc11-8cfd-49b9-84ac-7e79cdda30cc,claude-sonnet-4-20250514,anthropic,path-tracing,5272,5454,10726,579.820103,False,0.0,claude-sonnet-4-20250514,path-tracing,579.820103,False,0.0,False,579.820103 +f3c34cdd-6d9f-4117-b0f3-f15ac9b65381,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-cython-ext,20128,6306,26434,913.907689,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-cython-ext,913.907689,False,0.0,False,913.907689 +1fa04da8-c87c-4ea9-8e91-f0686cb9f198,claude-opus-4-1-20250805,anthropic,write-compressor,8295,10500,18795,1261.303716,False,0.0,claude-opus-4-1-20250805,write-compressor,1261.303716,False,0.0,False,1261.303716 +f08ccb40-eb68-4e21-a713-7ff8d95324a6,grok-code-fast-1,xai,bn-fit-modify,10097,6003,16100,1107.363996,False,0.0,grok-code-fast-1,bn-fit-modify,1107.363996,False,0.0,False,1107.363996 +426c4365-5cf9-4b6b-8529-2c294aebdd07,claude-sonnet-4-20250514,anthropic,constraints-scheduling,5124,3094,8218,403.9593,True,1.0,claude-sonnet-4-20250514,constraints-scheduling,403.9593,True,1.0,True,403.9593 +457db808-3feb-4f3b-b00b-07d11365529f,grok-4-0709,xai,polyglot-c-py,1161,833,1994,606.481813,True,1.0,grok-4-0709,polyglot-c-py,606.481813,True,0.6,True,606.481813 +f4bdb963-1997-4d0a-8244-17c79ab3529f,OpenAI/gpt-oss-20B,together_ai,polyglot-c-py,516,781,1297,169.126195,False,0.0,OpenAI/gpt-oss-20B,polyglot-c-py,169.126195,False,0.0,False,169.126195 +eccd6e7a-5624-422c-bd9e-a779204856e7,claude-opus-4-1-20250805,anthropic,configure-git-webserver,6682,1842,8524,506.423469,True,1.0,claude-opus-4-1-20250805,configure-git-webserver,506.423469,True,0.625,True,506.423469 +4e79cccb-31ed-4c37-8513-1b85cffe9dc7,claude-opus-4-1-20250805,anthropic,openssl-selfsigned-cert,3475,2632,6107,88.764477,True,1.0,claude-opus-4-1-20250805,openssl-selfsigned-cert,88.764477,True,1.0,True,88.764477 
+90e44b13-db81-454d-a0b6-75396a5916e7,zai-org/GLM-4.5-Air-FP8,together_ai,build-pov-ray,15619,4834,20453,804.24679,False,0.0,zai-org/GLM-4.5-Air-FP8,build-pov-ray,804.24679,False,0.0,False,804.24679 +1c5ab240-e32c-48b1-a66a-af9be0cd584d,gpt-5-mini,openai,pytorch-model-recovery,14435,21191,35626,855.838254,False,0.0,gpt-5-mini,pytorch-model-recovery,855.838254,False,0.0,False,855.838254 +20fc7cb0-8454-4ba0-a77a-157fb48e2dce,gpt-5-nano,openai,configure-git-webserver,6591,3451,10042,364.123252,False,0.0,gpt-5-nano,configure-git-webserver,364.123252,False,0.2,False,364.123252 +f4408203-2fa1-4ff7-8a1e-789b09c7e567,OpenAI/gpt-oss-20B,together_ai,port-compressor,7996,32980,40976,3600.039148,False,0.0,OpenAI/gpt-oss-20B,port-compressor,3600.039148,False,0.0,False,3600.039148 +06ae0449-cb21-42bb-b9d0-7044203d03c5,openai/gpt-oss-120b,together_ai,vulnerable-secret,12916,4989,17905,382.465756,False,0.0,openai/gpt-oss-120b,vulnerable-secret,382.465756,False,0.0,False,382.465756 +f096ea2b-5bf4-4561-9ac0-ada3f19112c0,claude-opus-4-1-20250805,anthropic,dna-assembly,18501,11908,30409,754.891937,False,0.0,claude-opus-4-1-20250805,dna-assembly,754.891937,False,0.0,False,754.891937 +a71ed3c3-4eb6-46c1-9fd6-859ac6b67f17,deepseek-ai/DeepSeek-V3.1,together_ai,sqlite-db-truncate,6650,4009,10659,152.114013,False,0.0,deepseek-ai/DeepSeek-V3.1,sqlite-db-truncate,152.114013,False,0.0,False,152.114013 +1cba150c-69a1-416e-b05a-0bf94c6090a3,gemini-2.5-pro,gemini,adaptive-rejection-sampler,11138,11923,23061,774.267194,False,0.0,gemini-2.5-pro,adaptive-rejection-sampler,774.267194,False,0.4,False,774.267194 +10e26a28-f40f-49f6-8451-d10717827599,gpt-5,openai,cobol-modernization,6816,3752,10568,434.831796,True,1.0,gpt-5,cobol-modernization,434.831796,True,1.0,True,434.831796 +03e402fe-73c6-4072-9199-8e51be1bf986,gemini-2.5-pro,gemini,db-wal-recovery,30292,8635,38927,902.236578,False,0.0,gemini-2.5-pro,db-wal-recovery,902.236578,False,0.0,False,902.236578 
+0000900d-99a6-492a-b6cc-dc3a02a8e29b,openai/gpt-oss-120b,together_ai,dna-assembly,5573,791,6364,73.196696,False,0.0,openai/gpt-oss-120b,dna-assembly,73.196696,False,0.0,False,73.196696 +94aeadb8-7ef8-464c-9e36-42b9da372884,claude-sonnet-4-20250514,anthropic,db-wal-recovery,3544,4294,7838,261.830652,False,0.0,claude-sonnet-4-20250514,db-wal-recovery,261.830652,False,0.0,False,261.830652 +dbba3f65-b266-4c37-aa6f-b6c915c8b4da,gpt-5,openai,db-wal-recovery,6175,7719,13894,1014.428489,False,0.0,gpt-5,db-wal-recovery,1014.428489,False,0.1428571428571428,False,1014.428489 +10699f84-e9ae-4c9c-a0b2-34545eacd4ca,gpt-5-mini,openai,fix-code-vulnerability,4853,13650,18503,904.18628,False,0.0,gpt-5-mini,fix-code-vulnerability,904.18628,False,0.0,False,904.18628 +70b4e21e-58cc-4ec5-bf06-754283ad6206,claude-sonnet-4-20250514,anthropic,reshard-c4-data,8688,7324,16012,495.955441,False,0.0,claude-sonnet-4-20250514,reshard-c4-data,495.955441,False,0.0,False,495.955441 +e28002c8-4c83-49a5-babc-4fad55afb951,gpt-5,openai,extract-elf,2500,1794,4294,198.657689,True,1.0,gpt-5,extract-elf,198.657689,True,0.2857142857142857,True,198.657689 +9bd77213-0756-4acc-85fa-af067cfada7a,gemini-2.5-pro,gemini,gpt2-codegolf,5286,6556,11842,900.01824,False,0.0,gemini-2.5-pro,gpt2-codegolf,900.01824,False,0.0,False,900.01824 +5f747fbc-102a-4372-84f4-b69ca27ebd17,claude-sonnet-4-20250514,anthropic,path-tracing,7512,8830,16342,688.470896,False,0.0,claude-sonnet-4-20250514,path-tracing,688.470896,False,0.0,False,688.470896 +6e48a98e-8902-45dc-8006-d0f97c9d8fd8,gemini-2.5-pro,gemini,code-from-image,5642,1410,7052,185.239353,True,1.0,gemini-2.5-pro,code-from-image,185.239353,True,1.0,True,185.239353 +973963fd-f94f-415a-b01e-003830f865e5,deepseek-ai/DeepSeek-V3.1,together_ai,video-processing,3895,3483,7378,108.320554,False,0.0,deepseek-ai/DeepSeek-V3.1,video-processing,108.320554,False,0.0,False,108.320554 
+8e1c3119-8c53-4383-a134-0eed538f5368,grok-code-fast-1,xai,polyglot-rust-c,1255,711,1966,60.939518,False,0.0,grok-code-fast-1,polyglot-rust-c,60.939518,False,0.0,False,60.939518 +fa83b1c4-cf59-4efe-ae1f-3f3d9f935f3a,zai-org/GLM-4.5-Air-FP8,together_ai,cobol-modernization,8227,6846,15073,446.492221,False,0.0,zai-org/GLM-4.5-Air-FP8,cobol-modernization,446.492221,False,0.4,False,446.492221 +d29570e7-ac70-457a-b457-122d9963dad6,gemini-2.5-flash,gemini,git-leak-recovery,11400,3827,15227,525.141885,True,1.0,gemini-2.5-flash,git-leak-recovery,525.141885,True,0.6,True,525.141885 +2b29ddb6-ccea-4ba3-bd42-0108506e496f,gemini-2.5-pro,gemini,reverse-engineering,14003,8711,22714,1803.890926,False,0.0,gemini-2.5-pro,reverse-engineering,1803.890926,False,0.0,False,1803.890926 +ef6066a3-c2a6-4abf-8e63-0af602aa0257,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-cython-ext,12022,4307,16329,913.170316,False,0.0,moonshotai/Kimi-K2-Instruct-0905,build-cython-ext,913.170316,False,0.0,False,913.170316 +b88074c6-bcff-41b7-b324-bfec10242d44,claude-sonnet-4-20250514,anthropic,reverse-engineering,17647,8985,26632,1809.554577,False,0.0,claude-sonnet-4-20250514,reverse-engineering,1809.554577,False,0.0,False,1809.554577 +6ace35a6-8943-44fe-ab50-12a804888879,deepseek-ai/DeepSeek-V3.1,together_ai,build-initramfs-qemu,7014,5203,12217,900.263867,False,0.0,deepseek-ai/DeepSeek-V3.1,build-initramfs-qemu,900.263867,False,0.0,False,900.263867 +59691d87-6fbe-43f6-830a-d285dc5fcfb6,gpt-5-nano,openai,bn-fit-modify,6121,5554,11675,385.591483,False,0.0,gpt-5-nano,bn-fit-modify,385.591483,False,0.0,False,385.591483 +413c3716-d159-4468-9946-22a68b37ec0e,grok-code-fast-1,xai,run-pdp11-code,5879,1507,7386,175.930435,False,0.0,grok-code-fast-1,run-pdp11-code,175.930435,False,0.0,False,175.930435 +7a156489-ea08-4fc5-9b15-b169c9fde7cf,claude-sonnet-4-20250514,anthropic,count-dataset-tokens,19900,6009,25909,708.12527,False,0.0,claude-sonnet-4-20250514,count-dataset-tokens,708.12527,False,0.0,False,708.12527 
+7bd796df-e2b8-4d9e-9ba7-79fcc6617b53,OpenAI/gpt-oss-20B,together_ai,adaptive-rejection-sampler,223,2417,2640,155.80654,False,0.0,OpenAI/gpt-oss-20B,adaptive-rejection-sampler,155.80654,False,0.0,False,155.80654 +8409492e-3e5a-4190-bb25-d05402226df8,OpenAI/gpt-oss-20B,together_ai,schemelike-metacircular-eval,2433,5672,8105,176.998226,False,0.0,OpenAI/gpt-oss-20B,schemelike-metacircular-eval,176.998226,False,0.0,False,176.998226 +f2064a7b-49fb-4cb6-b408-c9d3ee119f8f,zai-org/GLM-4.5-Air-FP8,together_ai,hf-model-inference,3908,2219,6127,92.532709,True,1.0,zai-org/GLM-4.5-Air-FP8,hf-model-inference,92.532709,True,0.8,True,92.532709 +cc1ef134-4987-46d1-bc2d-2913800c592c,gpt-5-mini,openai,sqlite-db-truncate,1895,1712,3607,68.423957,False,0.0,gpt-5-mini,sqlite-db-truncate,68.423957,False,0.0,False,68.423957 +c37c39e4-0c7a-46e9-819c-a37f9027b20a,claude-sonnet-4-20250514,anthropic,model-extraction-relu-logits,2234,1653,3887,1420.753144,False,0.0,claude-sonnet-4-20250514,model-extraction-relu-logits,1420.753144,False,0.0,False,1420.753144 +52738a4c-dc37-41c8-85c8-19b5dcbe35c0,deepseek-ai/DeepSeek-V3.1,together_ai,fix-code-vulnerability,6507,1287,7794,1009.212331,False,0.0,deepseek-ai/DeepSeek-V3.1,fix-code-vulnerability,1009.212331,False,0.2,False,1009.212331 +8da9f4bf-1222-4d0a-b6fa-fc34823bf024,claude-opus-4-1-20250805,anthropic,pytorch-model-recovery,8092,4718,12810,309.337275,True,1.0,claude-opus-4-1-20250805,pytorch-model-recovery,309.337275,True,1.0,True,309.337275 +a717d196-ee77-4c28-a6ae-b8c6f3463115,grok-4-0709,xai,nginx-request-logging,3705,1099,4804,277.766512,True,1.0,grok-4-0709,nginx-request-logging,277.766512,True,1.0,True,277.766512 +1114b076-eb58-463a-8d8e-ba0484ee3dbf,openai/gpt-oss-120b,together_ai,configure-git-webserver,4490,1456,5946,568.77527,False,0.0,openai/gpt-oss-120b,configure-git-webserver,568.77527,False,0.6,False,568.77527 
+3ce1c433-dc09-475f-91f8-1c9bf1adc942,OpenAI/gpt-oss-20B,together_ai,pypi-server,2969,955,3924,207.007948,True,1.0,OpenAI/gpt-oss-20B,pypi-server,207.007948,True,0.2,True,207.007948 +3a8d151e-ffac-43d4-8e25-f1e9c3240654,claude-opus-4-1-20250805,anthropic,winning-avg-corewars,13298,9583,22881,951.561942,True,1.0,claude-opus-4-1-20250805,winning-avg-corewars,951.561942,True,0.3333333333333333,True,951.561942 +5751c21c-5cf6-40d9-897f-7082225a2b12,deepseek-ai/DeepSeek-V3.1,together_ai,form-filling,8259,7241,15500,478.384476,True,1.0,deepseek-ai/DeepSeek-V3.1,form-filling,478.384476,True,0.8,True,478.384476 +fd21b178-e94e-457e-843d-0fa650c40962,gpt-5-nano,openai,qemu-startup,1477,1747,3224,1018.652489,False,0.0,gpt-5-nano,qemu-startup,1018.652489,False,0.0,False,1018.652489 +be73d57f-9a9d-46b0-be33-d67320b4c4f7,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,install-windows-3.11,8699,2124,10823,145.051022,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,install-windows-3.11,145.051022,False,0.0,False,145.051022 +2ad9b966-70af-4825-aba7-d63b3d0fd403,moonshotai/Kimi-K2-Instruct-0905,together_ai,large-scale-text-editing,7715,7846,15561,1201.332374,False,0.0,moonshotai/Kimi-K2-Instruct-0905,large-scale-text-editing,1201.332374,False,0.0,False,1201.332374 +cd6f129c-7664-4a93-9856-b4e79ca1e6e8,gpt-5-mini,openai,code-from-image,12431,12623,25054,1217.799886,False,0.0,gpt-5-mini,code-from-image,1217.799886,False,0.0,False,1217.799886 +6d8ef277-cebf-41e1-80ac-45f337a26299,OpenAI/gpt-oss-20B,together_ai,merge-diff-arc-agi-task,634,1468,2102,128.028064,False,0.0,OpenAI/gpt-oss-20B,merge-diff-arc-agi-task,128.028064,False,0.0,False,128.028064 +b39ba18e-5c9b-466f-af75-b92ae040c483,OpenAI/gpt-oss-20B,together_ai,log-summary-date-ranges,159,1940,2099,248.833063,False,0.0,OpenAI/gpt-oss-20B,log-summary-date-ranges,248.833063,False,0.0,False,248.833063 
+82e5ca76-e88d-4512-ab10-463cd62c7ed4,gpt-5-mini,openai,form-filling,4200,2709,6909,202.965418,True,1.0,gpt-5-mini,form-filling,202.965418,True,1.0,True,202.965418 +2a511ec9-bd36-4719-83f6-424e27fcff43,gemini-2.5-pro,gemini,reverse-engineering,11216,6673,17889,1502.86234,False,0.0,gemini-2.5-pro,reverse-engineering,1502.86234,False,0.0,False,1502.86234 +d839a4cb-e28c-48da-98ef-2b7f389cb7b7,gpt-5-mini,openai,openssl-selfsigned-cert,1959,2004,3963,224.869563,True,1.0,gpt-5-mini,openssl-selfsigned-cert,224.869563,True,0.8,True,224.869563 +7b78c7f2-6063-4274-8d97-2c2d986f1ce2,deepseek-ai/DeepSeek-V3.1,together_ai,path-tracing-reverse,16628,11556,28184,872.788249,False,0.0,deepseek-ai/DeepSeek-V3.1,path-tracing-reverse,872.788249,False,0.2,False,872.788249 +991c71d4-dd46-4f68-bd3e-ab35eb931a52,gpt-5-mini,openai,port-compressor,15700,26002,41702,3626.957065,False,0.0,gpt-5-mini,port-compressor,3626.957065,False,0.0,False,3626.957065 +c7ab5712-aff6-4792-8105-3358b797720b,grok-code-fast-1,xai,feal-linear-cryptanalysis,9715,6790,16505,625.302822,False,0.0,grok-code-fast-1,feal-linear-cryptanalysis,625.302822,False,0.0,False,625.302822 +768daabf-6d64-4c42-bbf4-3746519d38ee,deepseek-ai/DeepSeek-V3.1,together_ai,dna-assembly,5375,4924,10299,257.260316,False,0.0,deepseek-ai/DeepSeek-V3.1,dna-assembly,257.260316,False,0.0,False,257.260316 +379d7a79-ec80-46da-9518-1cae88098209,gemini-2.5-pro,gemini,fix-git,2567,1627,4194,141.68754,True,1.0,gemini-2.5-pro,fix-git,141.68754,True,1.0,True,141.68754 +b379b986-867b-494f-a689-4593c27d383f,gemini-2.5-pro,gemini,port-compressor,25531,35833,61364,3564.083488,False,0.0,gemini-2.5-pro,port-compressor,3564.083488,False,0.0,False,3564.083488 +961d6353-b25e-411f-b7a5-a4df1af2ffaa,moonshotai/Kimi-K2-Instruct-0905,together_ai,pypi-server,6634,4636,11270,249.04196,False,0.0,moonshotai/Kimi-K2-Instruct-0905,pypi-server,249.04196,False,0.2,False,249.04196 
+499420d3-3e08-4f92-bb70-765a7187a3ad,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,circuit-fibsqrt,15356,15719,31075,1684.166755,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,circuit-fibsqrt,1684.166755,False,0.0,False,1684.166755 +64986aa9-fbd0-4208-bbd0-bc088a3849ac,claude-sonnet-4-20250514,anthropic,make-doom-for-mips,15414,5907,21321,943.464124,False,0.0,claude-sonnet-4-20250514,make-doom-for-mips,943.464124,False,0.0,False,943.464124 +339da028-8c2d-443d-b471-07c917afb1b4,claude-sonnet-4-20250514,anthropic,schemelike-metacircular-eval,20787,14814,35601,557.23096,False,0.0,claude-sonnet-4-20250514,schemelike-metacircular-eval,557.23096,False,0.0,False,557.23096 +f73ca943-2986-4039-bf97-bfa98b99fc0c,grok-code-fast-1,xai,fix-code-vulnerability,5936,2365,8301,928.578719,False,0.0,grok-code-fast-1,fix-code-vulnerability,928.578719,False,0.0,False,928.578719 +9255d4c7-9963-4b2b-a0c7-252619f1afcf,claude-sonnet-4-20250514,anthropic,torch-tensor-parallelism,6715,4666,11381,344.673573,False,0.0,claude-sonnet-4-20250514,torch-tensor-parallelism,344.673573,False,0.0,False,344.673573 +efadf707-8168-4c10-94b3-b2a8c5125c4e,grok-code-fast-1,xai,train-fasttext,7821,5238,13059,2080.614079,False,0.0,grok-code-fast-1,train-fasttext,2080.614079,False,0.0,False,2080.614079 +8d60cb79-0ef3-40ce-9f9e-b842c69a3e02,grok-4-0709,xai,vulnerable-secret,5962,1771,7733,923.415844,True,1.0,grok-4-0709,vulnerable-secret,923.415844,True,0.6,True,923.415844 +41f87aee-0fc6-46ac-ab22-e27d65a7d3d3,gpt-5-nano,openai,break-filter-js-from-html,8918,11846,20764,1200.937706,False,0.0,gpt-5-nano,break-filter-js-from-html,1200.937706,False,0.0,False,1200.937706 +1f32547e-f906-4a8e-8c53-b29d9adae5dc,gemini-2.5-flash,gemini,vulnerable-secret,2190,3440,5630,906.549594,False,0.0,gemini-2.5-flash,vulnerable-secret,906.549594,False,0.0,False,906.549594 
+d53e6d3c-524c-4dd4-9b99-8f433c6dc90b,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,large-scale-text-editing,7664,8311,15975,1200.509594,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,large-scale-text-editing,1200.509594,False,0.0,False,1200.509594 +06e755b3-0d5a-4057-988e-3546ad18a8cb,gemini-2.5-pro,gemini,qemu-alpine-ssh,1952,2022,3974,439.323477,False,0.0,gemini-2.5-pro,qemu-alpine-ssh,439.323477,False,0.2,False,439.323477 +52995888-e2ab-4bff-9bdb-6a54fe5404c8,zai-org/GLM-4.5-Air-FP8,together_ai,constraints-scheduling,6418,6453,12871,360.917783,True,1.0,zai-org/GLM-4.5-Air-FP8,constraints-scheduling,360.917783,True,0.8,True,360.917783 +434b8a92-ba4a-4dd3-9454-a86c668d7c43,zai-org/GLM-4.5-Air-FP8,together_ai,path-tracing,3112,3862,6974,95.967614,False,0.0,zai-org/GLM-4.5-Air-FP8,path-tracing,95.967614,False,0.0,False,95.967614 +dee41e04-1644-4de3-b5b1-c46cc1df7635,openai/gpt-oss-120b,together_ai,password-recovery,3393,5190,8583,900.797521,False,0.0,openai/gpt-oss-120b,password-recovery,900.797521,False,0.2,False,900.797521 +c0bb5b47-b93d-4695-8b2f-a9afc96ca21b,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,feal-linear-cryptanalysis,15333,16063,31396,1801.035769,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,feal-linear-cryptanalysis,1801.035769,False,0.0,False,1801.035769 +2229f55e-8f95-418b-bd52-cc330212ddc3,gpt-5,openai,pytorch-model-cli,2442,3296,5738,900.00065,False,0.0,gpt-5,pytorch-model-cli,900.00065,False,0.0,False,900.00065 +5f234901-445e-482f-8ce2-e9e2a082a74c,claude-sonnet-4-20250514,anthropic,form-filling,9684,7575,17259,338.867321,True,1.0,claude-sonnet-4-20250514,form-filling,338.867321,True,1.0,True,338.867321 +199dea09-10b2-4261-9fd7-ae045ebd6b73,gpt-5,openai,qemu-alpine-ssh,1316,1532,2848,461.559064,False,0.0,gpt-5,qemu-alpine-ssh,461.559064,False,0.1666666666666666,False,461.559064 
+136ae080-81a7-401e-9e66-8b9df4b662ed,grok-code-fast-1,xai,path-tracing,3168,1692,4860,864.613321,False,0.0,grok-code-fast-1,path-tracing,864.613321,False,0.0,False,864.613321 +3b6709e6-cfa4-4551-b376-fb7c2966129b,gpt-5-mini,openai,code-from-image,33357,21914,55271,1200.001952,False,0.0,gpt-5-mini,code-from-image,1200.001952,False,0.0,False,1200.001952 +9dfd5c5f-a61c-4daf-9bdf-5643c5ae6a7a,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-initramfs-qemu,19043,6350,25393,526.349524,False,0.0,moonshotai/Kimi-K2-Instruct-0905,build-initramfs-qemu,526.349524,False,0.0,False,526.349524 +5e79216e-c42a-4949-9f33-65582bed2132,gemini-2.5-flash,gemini,fix-ocaml-gc,59701,41262,100963,3600.002398,False,0.0,gemini-2.5-flash,fix-ocaml-gc,3600.002398,False,0.0,False,3600.002398 +1c2a7380-3c92-49e6-aed3-366ab1a18c98,deepseek-ai/DeepSeek-V3.1,together_ai,pytorch-model-recovery,15482,9100,24582,706.758314,True,1.0,deepseek-ai/DeepSeek-V3.1,pytorch-model-recovery,706.758314,True,0.6,True,706.758314 +5de96757-f791-4e8e-bad9-4fd5e5dc3448,gemini-2.5-flash,gemini,train-fasttext,31457,11723,43180,3643.970918,False,0.0,gemini-2.5-flash,train-fasttext,3643.970918,False,0.0,False,3643.970918 +8c08453a-ae7c-47fe-bfd1-5a2282d00205,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,mteb-leaderboard,27048,4819,31867,468.001021,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,mteb-leaderboard,468.001021,False,0.0,False,468.001021 +8b4b606c-bceb-41b8-a19f-8a7c2281a790,gemini-2.5-pro,gemini,pytorch-model-cli,7510,2385,9895,346.949304,False,0.0,gemini-2.5-pro,pytorch-model-cli,346.949304,False,0.4,False,346.949304 +70a666d1-0963-4c10-a6c3-291b59275f5b,grok-code-fast-1,xai,reverse-engineering,5846,2282,8128,567.980075,False,0.0,grok-code-fast-1,reverse-engineering,567.980075,False,0.0,False,567.980075 +e16faf66-75d5-4309-b8d8-3741e7002606,gemini-2.5-flash,gemini,path-tracing,2417,1931,4348,273.498202,False,0.0,gemini-2.5-flash,path-tracing,273.498202,False,0.0,False,273.498202 
+c91d7024-e738-4612-a9fb-42a566d2e481,zai-org/GLM-4.5-Air-FP8,together_ai,path-tracing,43668,15354,59022,1045.947678,False,0.0,zai-org/GLM-4.5-Air-FP8,path-tracing,1045.947678,False,0.0,False,1045.947678 +14cf5a59-e1c1-4fa4-9511-8811bb56b711,deepseek-ai/DeepSeek-V3.1,together_ai,dna-assembly,12906,9134,22040,720.039977,False,0.0,deepseek-ai/DeepSeek-V3.1,dna-assembly,720.039977,False,0.0,False,720.039977 +7254b1bb-c27f-413b-b258-903a6674bc41,deepseek-ai/DeepSeek-V3.1,together_ai,make-mips-interpreter,27568,20728,48296,1478.041645,False,0.0,deepseek-ai/DeepSeek-V3.1,make-mips-interpreter,1478.041645,False,0.0,False,1478.041645 +b6ef5f8f-7e31-4183-b93a-0bd1823cad74,gpt-5-nano,openai,count-dataset-tokens,12215,5765,17980,907.084235,False,0.0,gpt-5-nano,count-dataset-tokens,907.084235,False,0.0,False,907.084235 +87f93bdc-15b6-407a-9a72-63146b4e26ed,openai/gpt-oss-120b,together_ai,openssl-selfsigned-cert,1819,1012,2831,64.629051,True,1.0,openai/gpt-oss-120b,openssl-selfsigned-cert,64.629051,True,0.8,True,64.629051 +0df821ee-96c3-4a3d-9f11-d69aadecfbaf,gpt-5,openai,dna-insert,4882,4980,9862,362.328948,False,0.0,gpt-5,dna-insert,362.328948,False,0.0,False,362.328948 +4e02c6f8-3e1e-487e-a557-7a164bf22323,gpt-5,openai,mteb-leaderboard,14410,13200,27610,965.411028,False,0.0,gpt-5,mteb-leaderboard,965.411028,False,0.0,False,965.411028 +96d1b96b-e346-4460-a737-a4d5f73c8e8a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,wasm-pipeline,11574,3486,15060,573.818803,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,wasm-pipeline,573.818803,False,0.0,False,573.818803 +3f004be1-e93e-460d-97e2-c5a20559ee7d,zai-org/GLM-4.5-Air-FP8,together_ai,openssl-selfsigned-cert,1349,2351,3700,91.605442,False,0.0,zai-org/GLM-4.5-Air-FP8,openssl-selfsigned-cert,91.605442,False,0.0,False,91.605442 
+6b3784ec-ec17-482c-92d8-89a5624f7112,gemini-2.5-pro,gemini,install-klee-minimal,15492,2323,17815,901.982227,False,0.0,gemini-2.5-pro,install-klee-minimal,901.982227,False,0.0,False,901.982227 +989da270-4ef2-47f7-9154-9bf999730fdc,moonshotai/Kimi-K2-Instruct-0905,together_ai,polyglot-rust-c,7137,8485,15622,909.688541,False,0.0,moonshotai/Kimi-K2-Instruct-0905,polyglot-rust-c,909.688541,False,0.0,False,909.688541 +66137536-1a88-40ad-8f67-72d64ed280be,gpt-5,openai,constraints-scheduling,5013,3432,8445,153.199702,True,1.0,gpt-5,constraints-scheduling,153.199702,True,0.8571428571428571,True,153.199702 +b3e296e4-824d-4dbc-af37-0729ce40ce4b,openai/gpt-oss-120b,together_ai,sqlite-with-gcov,1209,925,2134,247.866984,True,1.0,openai/gpt-oss-120b,sqlite-with-gcov,247.866984,True,0.8,True,247.866984 +46fd2c8a-b6a2-4cfd-b783-7599c0d4faf0,openai/gpt-oss-120b,together_ai,torch-tensor-parallelism,2913,4553,7466,590.599073,False,0.0,openai/gpt-oss-120b,torch-tensor-parallelism,590.599073,False,0.0,False,590.599073 +283d25bc-2e79-4301-840e-698575cec4e6,grok-code-fast-1,xai,port-compressor,13784,19328,33112,1162.637823,False,0.0,grok-code-fast-1,port-compressor,1162.637823,False,0.0,False,1162.637823 +93e21952-23fc-4698-9919-a843da9ee341,moonshotai/Kimi-K2-Instruct-0905,together_ai,filter-js-from-html,3521,3352,6873,335.55509,False,0.0,moonshotai/Kimi-K2-Instruct-0905,filter-js-from-html,335.55509,False,0.0,False,335.55509 +bf25fe96-a679-445e-b299-25ffc963e6a0,gemini-2.5-pro,gemini,model-extraction-relu-logits,4561,1724,6285,556.541947,False,0.0,gemini-2.5-pro,model-extraction-relu-logits,556.541947,False,0.0,False,556.541947 +5ecf2fc0-3c49-44b6-9e73-dbaed520130d,gemini-2.5-flash,gemini,constraints-scheduling,5540,3658,9198,492.901699,False,0.0,gemini-2.5-flash,constraints-scheduling,492.901699,False,0.4,False,492.901699 
+cc8c841a-774e-4ea9-b732-fafa8c12cb81,claude-sonnet-4-20250514,anthropic,qemu-alpine-ssh,1308,921,2229,1009.371395,False,0.0,claude-sonnet-4-20250514,qemu-alpine-ssh,1009.371395,False,0.6,False,1009.371395 +1aebe770-0355-487b-9581-e63b532da6c9,grok-4-0709,xai,sanitize-git-repo,13048,1934,14982,705.613592,False,0.0,grok-4-0709,sanitize-git-repo,705.613592,False,0.0,False,705.613592 +e223545b-6ae5-4184-9871-d0a4cb936399,gpt-5-mini,openai,model-extraction-relu-logits,2080,1663,3743,219.411444,False,0.0,gpt-5-mini,model-extraction-relu-logits,219.411444,False,0.0,False,219.411444 +171624f6-7681-47a6-830f-0ebd546b2047,zai-org/GLM-4.5-Air-FP8,together_ai,fix-git,15979,7714,23693,920.482572,False,0.0,zai-org/GLM-4.5-Air-FP8,fix-git,920.482572,False,0.6,False,920.482572 +415cdd03-528d-4b67-a938-a898df6e9557,zai-org/GLM-4.5-Air-FP8,together_ai,model-extraction-relu-logits,12815,9426,22241,775.494639,True,1.0,zai-org/GLM-4.5-Air-FP8,model-extraction-relu-logits,775.494639,True,0.2,True,775.494639 +2f48f6d3-9a5c-4470-bcc6-965701171f94,zai-org/GLM-4.5-Air-FP8,together_ai,wasm-pipeline,14328,9787,24115,901.235036,False,0.0,zai-org/GLM-4.5-Air-FP8,wasm-pipeline,901.235036,False,0.2,False,901.235036 +1b54179d-a9d4-4225-8a79-495a68f3a314,zai-org/GLM-4.5-Air-FP8,together_ai,make-doom-for-mips,17346,3859,21205,920.134017,False,0.0,zai-org/GLM-4.5-Air-FP8,make-doom-for-mips,920.134017,False,0.0,False,920.134017 +c67f451d-6fbc-413a-b078-19d09aa4fff5,claude-opus-4-1-20250805,anthropic,build-cython-ext,17426,5803,23229,819.120516,False,0.0,claude-opus-4-1-20250805,build-cython-ext,819.120516,False,0.0,False,819.120516 +849de4bd-8ee5-4870-a8f0-5e15aa773c50,claude-opus-4-1-20250805,anthropic,form-filling,6360,4331,10691,209.095213,True,1.0,claude-opus-4-1-20250805,form-filling,209.095213,True,1.0,True,209.095213 
+6a5d43a0-0fae-4a90-bb79-b4085d7023bb,openai/gpt-oss-120b,together_ai,prove-plus-comm,1371,646,2017,36.75817,True,1.0,openai/gpt-oss-120b,prove-plus-comm,36.75817,True,1.0,True,36.75817 +39a91c9f-52fa-4158-92ce-f51cdf553ba5,OpenAI/gpt-oss-20B,together_ai,train-fasttext,8253,24701,32954,3601.535597,False,0.0,OpenAI/gpt-oss-20B,train-fasttext,3601.535597,False,0.0,False,3601.535597 +d4aae31c-9030-4983-b6f1-163c3ce875e9,deepseek-ai/DeepSeek-V3.1,together_ai,prove-plus-comm,1704,1236,2940,106.915639,True,1.0,deepseek-ai/DeepSeek-V3.1,prove-plus-comm,106.915639,True,1.0,True,106.915639 +7a484c9e-f117-43f9-b0fd-1382ee75bc04,grok-code-fast-1,xai,filter-js-from-html,1152,574,1726,35.77445,False,0.0,grok-code-fast-1,filter-js-from-html,35.77445,False,0.0,False,35.77445 +ab27df81-2b05-45f4-ae2a-7ce61f570c33,gpt-5,openai,adaptive-rejection-sampler,2852,10326,13178,901.473466,False,0.0,gpt-5,adaptive-rejection-sampler,901.473466,False,0.4,False,901.473466 +bfbb578c-3528-4b98-90a3-0c3fd270aacd,claude-opus-4-1-20250805,anthropic,reverse-engineering,29756,12827,42583,1802.352125,False,0.0,claude-opus-4-1-20250805,reverse-engineering,1802.352125,False,0.0,False,1802.352125 +5a865dfe-904d-40eb-8cf8-5673296c732a,zai-org/GLM-4.5-Air-FP8,together_ai,db-wal-recovery,3123,4494,7617,910.573184,False,0.0,zai-org/GLM-4.5-Air-FP8,db-wal-recovery,910.573184,False,0.0,False,910.573184 +120412fd-90b8-40e2-99cf-4ee0a21cec29,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,qemu-startup,2073,2007,4080,328.085657,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,qemu-startup,328.085657,False,0.0,False,328.085657 +83d5a3ac-f0a9-477f-8ee7-f4d2d74a0c4a,gemini-2.5-pro,gemini,dna-insert,6365,2509,8874,290.502575,False,0.0,gemini-2.5-pro,dna-insert,290.502575,False,0.0,False,290.502575 +1c3ba781-ef0d-4307-88be-4a47b29dd401,claude-sonnet-4-20250514,anthropic,db-wal-recovery,5269,5668,10937,307.527053,False,0.0,claude-sonnet-4-20250514,db-wal-recovery,307.527053,False,0.0,False,307.527053 
+bf26c899-a265-41ce-b782-1bfc20651720,openai/gpt-oss-120b,together_ai,qemu-alpine-ssh,3110,5935,9045,951.269345,False,0.0,openai/gpt-oss-120b,qemu-alpine-ssh,951.269345,False,0.0,False,951.269345 +fb5bc37e-1e80-42fb-8a1d-e97fb65dc585,deepseek-ai/DeepSeek-V3.1,together_ai,log-summary-date-ranges,9210,3748,12958,107.215657,False,0.0,deepseek-ai/DeepSeek-V3.1,log-summary-date-ranges,107.215657,False,0.4,False,107.215657 +327719e8-f7ca-450a-a2b4-7816903ae765,moonshotai/Kimi-K2-Instruct-0905,together_ai,db-wal-recovery,2887,3571,6458,127.840978,False,0.0,moonshotai/Kimi-K2-Instruct-0905,db-wal-recovery,127.840978,False,0.0,False,127.840978 +fd6ffe19-2b47-4463-aa15-f2fc1806f720,deepseek-ai/DeepSeek-V3.1,together_ai,hf-model-inference,4502,2011,6513,437.601852,True,1.0,deepseek-ai/DeepSeek-V3.1,hf-model-inference,437.601852,True,0.8,True,437.601852 +27b29555-6dcf-4ae2-bf78-a4001bd1e92a,gpt-5,openai,financial-document-processor,12175,8742,20917,457.32104,False,0.0,gpt-5,financial-document-processor,457.32104,False,0.0,False,457.32104 +9be7fb66-cc9d-43ee-b38a-6691c6ba27b0,gpt-5-nano,openai,sparql-university,2451,3038,5489,933.821437,False,0.0,gpt-5-nano,sparql-university,933.821437,False,0.0,False,933.821437 +fb8ca50c-6998-4f57-bcd8-9fac190b5d7f,gpt-5-nano,openai,build-pov-ray,14754,15409,30163,6004.218408,False,0.0,gpt-5-nano,build-pov-ray,6004.218408,False,0.0,False,6004.218408 +0ed40dd5-8061-4dad-9655-cfc224202cdc,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,torch-tensor-parallelism,10900,2036,12936,160.969453,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,torch-tensor-parallelism,160.969453,False,0.0,False,160.969453 +e1e03b63-fe0d-47df-9b7b-3f4195ecd59e,claude-sonnet-4-20250514,anthropic,build-initramfs-qemu,3939,3612,7551,980.620983,False,0.0,claude-sonnet-4-20250514,build-initramfs-qemu,980.620983,False,0.0,False,980.620983 
+06ea7903-4d64-4826-b17a-e0d939b40a12,moonshotai/Kimi-K2-Instruct-0905,together_ai,code-from-image,23357,14656,38013,1202.914415,False,0.0,moonshotai/Kimi-K2-Instruct-0905,code-from-image,1202.914415,False,0.6,False,1202.914415 +11e41d76-4685-452a-b9fb-83ff05e2516d,gemini-2.5-pro,gemini,install-klee-minimal,11735,2180,13915,902.006206,False,0.0,gemini-2.5-pro,install-klee-minimal,902.006206,False,0.0,False,902.006206 +be5762e7-756b-44df-a6fc-b975203b3131,gpt-5-nano,openai,tune-mjcf,14208,15528,29736,900.168726,False,0.0,gpt-5-nano,tune-mjcf,900.168726,False,0.0,False,900.168726 +04359fed-7181-4358-9bc1-c287cb91ea2e,grok-code-fast-1,xai,schemelike-metacircular-eval,8496,7036,15532,2458.884372,False,0.0,grok-code-fast-1,schemelike-metacircular-eval,2458.884372,False,0.0,False,2458.884372 +0a84d848-147e-48f2-902d-b1a172df3b38,claude-sonnet-4-20250514,anthropic,fix-code-vulnerability,16059,5640,21699,760.944782,True,1.0,claude-sonnet-4-20250514,fix-code-vulnerability,760.944782,True,0.8,True,760.944782 +2861ea76-0488-4961-8258-ce153dd2c063,gpt-5-nano,openai,write-compressor,2538,1338,3876,284.346443,False,0.0,gpt-5-nano,write-compressor,284.346443,False,0.0,False,284.346443 +89e1f170-07d3-43c8-9b18-f8a4eb41c9d4,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,openssl-selfsigned-cert,2841,2271,5112,166.120489,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,openssl-selfsigned-cert,166.120489,True,0.4,True,166.120489 +98c85ef1-1886-4d04-93a9-36d48e7fa859,claude-sonnet-4-20250514,anthropic,video-processing,5484,4485,9969,284.249982,False,0.0,claude-sonnet-4-20250514,video-processing,284.249982,False,0.0,False,284.249982 +4441684a-f656-4525-b1f5-a1838a6dca24,gemini-2.5-pro,gemini,crack-7z-hash,9440,3459,12899,328.915003,True,1.0,gemini-2.5-pro,crack-7z-hash,328.915003,True,0.8,True,328.915003 
+a6bae596-4bf1-4f90-9237-c5b4c5773712,gpt-5,openai,sanitize-git-repo,7698,3689,11387,916.477618,False,0.0,gpt-5,sanitize-git-repo,916.477618,False,0.2857142857142857,False,916.477618 +ff555fb1-798c-4c2b-b26a-150666b8168e,openai/gpt-oss-120b,together_ai,make-mips-interpreter,30564,41371,71935,1805.902352,False,0.0,openai/gpt-oss-120b,make-mips-interpreter,1805.902352,False,0.0,False,1805.902352 +a6adc374-afbf-4a74-8100-eb78326711ea,gpt-5,openai,torch-tensor-parallelism,2961,4141,7102,234.572263,False,0.0,gpt-5,torch-tensor-parallelism,234.572263,False,0.0,False,234.572263 +d12ca302-b458-44bf-b928-6ddef204d9f8,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,bn-fit-modify,21182,8139,29321,1332.206074,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,bn-fit-modify,1332.206074,False,0.0,False,1332.206074 +134c0eed-f520-408e-8d5a-6a27d59d30ba,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-initramfs-qemu,7124,4588,11712,534.182077,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-initramfs-qemu,534.182077,False,0.0,False,534.182077 +ec5caf4f-3214-49ad-a838-4bcda768beb0,gpt-5,openai,hf-model-inference,4421,1643,6064,385.184219,True,1.0,gpt-5,hf-model-inference,385.184219,True,1.0,True,385.184219 +578f6b33-23dd-4fdb-bbcb-a7ae0349bb6d,gpt-5-mini,openai,fix-git,10004,3029,13033,482.476693,True,1.0,gpt-5-mini,fix-git,482.476693,True,0.6,True,482.476693 +d13f8495-2b48-4b15-8658-f186ceb675a4,zai-org/GLM-4.5-Air-FP8,together_ai,regex-log,2910,2818,5728,93.218095,False,0.0,zai-org/GLM-4.5-Air-FP8,regex-log,93.218095,False,0.2,False,93.218095 +2fe66311-4894-4249-96f9-916b8d440e1f,gemini-2.5-pro,gemini,port-compressor,50958,51937,102895,3600.001435,False,0.0,gemini-2.5-pro,port-compressor,3600.001435,False,0.0,False,3600.001435 +44294908-ecd5-430f-adae-accf696ae071,grok-4-0709,xai,dna-insert,963,249,1212,366.976216,False,0.0,grok-4-0709,dna-insert,366.976216,False,0.0,False,366.976216 
+3310e3ad-6f71-45af-88bc-1c4dc494de54,grok-4-0709,xai,log-summary-date-ranges,2055,2170,4225,457.625986,False,0.0,grok-4-0709,log-summary-date-ranges,457.625986,False,0.0,False,457.625986 +92c6c990-00ce-4d3c-a165-6902bffa6d9d,deepseek-ai/DeepSeek-V3.1,together_ai,db-wal-recovery,7000,6531,13531,903.474161,False,0.0,deepseek-ai/DeepSeek-V3.1,db-wal-recovery,903.474161,False,0.0,False,903.474161 +f892657e-e2bb-41ef-83e6-cb835192931c,grok-code-fast-1,xai,vulnerable-secret,3467,2473,5940,169.465279,True,1.0,grok-code-fast-1,vulnerable-secret,169.465279,True,0.6,True,169.465279 +6744f165-9919-4ba8-a04c-bddfd0fc46c2,grok-code-fast-1,xai,form-filling,4519,2670,7189,118.443591,True,1.0,grok-code-fast-1,form-filling,118.443591,True,0.6,True,118.443591 +62a80648-5f1e-4b66-a738-227919c138cf,gpt-5-mini,openai,nginx-request-logging,4072,1716,5788,200.33012,True,1.0,gpt-5-mini,nginx-request-logging,200.33012,True,0.4,True,200.33012 +81645c37-250d-47f5-be04-241ef8a8482e,grok-code-fast-1,xai,wasm-pipeline,7212,2901,10113,315.804973,False,0.0,grok-code-fast-1,wasm-pipeline,315.804973,False,0.2,False,315.804973 +9e91ce44-e2b8-48cf-9824-c0284b67194a,gpt-5,openai,merge-diff-arc-agi-task,7776,3474,11250,412.923203,True,1.0,gpt-5,merge-diff-arc-agi-task,412.923203,True,1.0,True,412.923203 +730e39b6-628a-434f-8c44-e2df076c5ed4,claude-sonnet-4-20250514,anthropic,bn-fit-modify,20220,8271,28491,806.876033,True,1.0,claude-sonnet-4-20250514,bn-fit-modify,806.876033,True,0.8,True,806.876033 +f83fb955-0a19-441c-8343-d723811ecf42,gemini-2.5-flash,gemini,chess-best-move,14330,19147,33477,907.158475,False,0.0,gemini-2.5-flash,chess-best-move,907.158475,False,0.0,False,907.158475 +7734c321-1804-4408-b076-2e15f9504101,gemini-2.5-flash,gemini,build-pov-ray,20863,74332,95195,6000.193284,False,0.0,gemini-2.5-flash,build-pov-ray,6000.193284,False,0.0,False,6000.193284 
+20b0e75c-448b-4c77-ba8b-a22400256879,zai-org/GLM-4.5-Air-FP8,together_ai,port-compressor,45499,32908,78407,3615.199374,False,0.0,zai-org/GLM-4.5-Air-FP8,port-compressor,3615.199374,False,0.0,False,3615.199374 +2a893b34-3159-499d-ad5c-5cd04f69800f,openai/gpt-oss-120b,together_ai,vulnerable-secret,2771,6590,9361,909.075465,False,0.0,openai/gpt-oss-120b,vulnerable-secret,909.075465,False,0.0,False,909.075465 +2dd57c40-3797-4348-aecf-ac2c11aeac50,claude-sonnet-4-20250514,anthropic,install-windows-3.11,10390,4866,15256,408.177102,False,0.0,claude-sonnet-4-20250514,install-windows-3.11,408.177102,False,0.0,False,408.177102 +c8798727-9608-4677-a115-60c304852b82,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,pytorch-model-recovery,21180,11803,32983,900.669141,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,pytorch-model-recovery,900.669141,False,0.0,False,900.669141 +70c6ce54-bfdb-4778-a3ee-2417ccebd570,gpt-5-nano,openai,video-processing,2776,2052,4828,145.175298,False,0.0,gpt-5-nano,video-processing,145.175298,False,0.0,False,145.175298 +b219161c-e366-446b-ae52-94a004ee464c,moonshotai/Kimi-K2-Instruct-0905,together_ai,torch-tensor-parallelism,3132,1735,4867,93.879562,False,0.0,moonshotai/Kimi-K2-Instruct-0905,torch-tensor-parallelism,93.879562,False,0.0,False,93.879562 +f7ad557c-12ed-4ce0-8b33-694dbb81190d,claude-sonnet-4-20250514,anthropic,qemu-startup,2797,3426,6223,768.555707,True,1.0,claude-sonnet-4-20250514,qemu-startup,768.555707,True,0.4,True,768.555707 +bb589b01-66a6-4610-89ee-913042e7ac87,OpenAI/gpt-oss-20B,together_ai,code-from-image,210,198,408,32.796986,False,0.0,OpenAI/gpt-oss-20B,code-from-image,32.796986,False,0.0,False,32.796986 +e8552904-cc24-4377-9cf9-732b5db09d74,gemini-2.5-flash,gemini,install-windows-3.11,7093,4647,11740,1228.322464,False,0.0,gemini-2.5-flash,install-windows-3.11,1228.322464,False,0.0,False,1228.322464 
+3de59e94-3567-48ee-8d51-13ac73600e40,gpt-5-mini,openai,fix-code-vulnerability,4098,7321,11419,900.312394,False,0.0,gpt-5-mini,fix-code-vulnerability,900.312394,False,0.0,False,900.312394 +5a599397-d5d1-498b-9ba0-6062f8a33ce1,deepseek-ai/DeepSeek-V3.1,together_ai,crack-7z-hash,12995,7497,20492,608.895771,True,1.0,deepseek-ai/DeepSeek-V3.1,crack-7z-hash,608.895771,True,0.8,True,608.895771 +fdc82994-15a6-4eaa-840b-abe86cce435e,gpt-5,openai,sqlite-with-gcov,5210,1299,6509,553.358463,False,0.0,gpt-5,sqlite-with-gcov,553.358463,False,0.3333333333333333,False,553.358463 +1002e53c-73d9-4692-b6d2-0347eeccea75,claude-sonnet-4-20250514,anthropic,schemelike-metacircular-eval,13936,9111,23047,2452.707799,False,0.0,claude-sonnet-4-20250514,schemelike-metacircular-eval,2452.707799,False,0.0,False,2452.707799 +c4976abe-94ca-4a31-9292-bb77ad7e7a46,OpenAI/gpt-oss-20B,together_ai,sparql-university,1876,2381,4257,153.035339,False,0.0,OpenAI/gpt-oss-20B,sparql-university,153.035339,False,0.0,False,153.035339 +07c17916-c56d-420a-9f94-6d10577181e0,gemini-2.5-pro,gemini,install-windows-3.11,6199,1981,8180,246.344728,False,0.0,gemini-2.5-pro,install-windows-3.11,246.344728,False,0.0,False,246.344728 +31e167bc-8931-46b2-bd3d-302b2a65d47d,grok-code-fast-1,xai,log-summary-date-ranges,3819,1353,5172,44.254706,False,0.0,grok-code-fast-1,log-summary-date-ranges,44.254706,False,0.0,False,44.254706 +d888aa36-01b0-4d0f-b388-ed48d1ee41a5,claude-sonnet-4-20250514,anthropic,extract-elf,10950,6162,17112,851.343673,True,1.0,claude-sonnet-4-20250514,extract-elf,851.343673,True,0.2,True,851.343673 +642bf13e-2e14-4932-a934-1fa2f8a4f5e9,openai/gpt-oss-120b,together_ai,db-wal-recovery,4997,7007,12004,213.828565,False,0.0,openai/gpt-oss-120b,db-wal-recovery,213.828565,False,0.0,False,213.828565 +40d35fb2-9ae6-4beb-b77e-ba2bc8c2fa33,claude-opus-4-1-20250805,anthropic,chess-best-move,8520,8008,16528,231.781019,False,0.0,claude-opus-4-1-20250805,chess-best-move,231.781019,False,0.0,False,231.781019 
+62df704f-1020-404d-a9d6-e2f27ce0c402,gemini-2.5-flash,gemini,path-tracing-reverse,18447,21241,39688,1816.031548,False,0.0,gemini-2.5-flash,path-tracing-reverse,1816.031548,False,0.0,False,1816.031548 +b59ecf56-52bd-4a33-ad47-8fa0193f959e,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,vulnerable-secret,3185,2791,5976,906.910553,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,vulnerable-secret,906.910553,False,0.4,False,906.910553 +f9ac8190-0d0d-4692-9176-e63a23affec3,moonshotai/Kimi-K2-Instruct-0905,together_ai,db-wal-recovery,3425,3940,7365,519.020555,False,0.0,moonshotai/Kimi-K2-Instruct-0905,db-wal-recovery,519.020555,False,0.0,False,519.020555 +440d0bb1-dfbd-4ade-8eac-44e30c4882be,gpt-5-nano,openai,path-tracing-reverse,5699,1913,7612,206.151477,False,0.0,gpt-5-nano,path-tracing-reverse,206.151477,False,0.0,False,206.151477 +f0d20d55-412c-4831-b731-a405f63c9ae6,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,make-doom-for-mips,9846,3315,13161,363.680174,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,make-doom-for-mips,363.680174,False,0.0,False,363.680174 +9a390507-2ea7-41cc-a572-200d550b6c5d,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,mteb-leaderboard,1805,1630,3435,142.146844,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,mteb-leaderboard,142.146844,False,0.0,False,142.146844 +da128935-f806-4adf-abb7-ecacc7e7071a,claude-opus-4-1-20250805,anthropic,dna-assembly,14951,9357,24308,734.660342,False,0.0,claude-opus-4-1-20250805,dna-assembly,734.660342,False,0.0,False,734.660342 +d85a7cf9-ca2e-4ac6-902d-46171722c69d,claude-opus-4-1-20250805,anthropic,extract-elf,4938,1910,6848,226.238576,True,1.0,claude-opus-4-1-20250805,extract-elf,226.238576,True,0.8888888888888888,True,226.238576 +87b821c8-0f87-4f4c-a923-60bfb7660416,gpt-5,openai,winning-avg-corewars,30289,27149,57438,3600.55112,False,0.0,gpt-5,winning-avg-corewars,3600.55112,False,0.2857142857142857,False,3600.55112 
+b95d8ecb-e09b-413c-8ab1-b4d23f719401,gemini-2.5-flash,gemini,regex-log,1431,1248,2679,232.693721,True,1.0,gemini-2.5-flash,regex-log,232.693721,True,0.8,True,232.693721 +19b6f731-4d6e-4ed7-8a0d-b8dc1329b53a,OpenAI/gpt-oss-20B,together_ai,video-processing,1872,1993,3865,67.445497,False,0.0,OpenAI/gpt-oss-20B,video-processing,67.445497,False,0.0,False,67.445497 +d8d31239-200b-465a-ab52-bb71630fd201,deepseek-ai/DeepSeek-V3.1,together_ai,make-mips-interpreter,26626,22068,48694,1801.022778,False,0.0,deepseek-ai/DeepSeek-V3.1,make-mips-interpreter,1801.022778,False,0.0,False,1801.022778 +feb1c748-359f-462e-ab64-21f015cd04a7,openai/gpt-oss-120b,together_ai,constraints-scheduling,2897,2115,5012,50.011653,True,1.0,openai/gpt-oss-120b,constraints-scheduling,50.011653,True,1.0,True,50.011653 +c1de1b39-aca2-4d3f-b6e3-fff00b000e42,gpt-5-nano,openai,video-processing,3131,2786,5917,125.773703,False,0.0,gpt-5-nano,video-processing,125.773703,False,0.0,False,125.773703 +41c9e386-6900-4781-920c-94c2020fd902,grok-code-fast-1,xai,torch-tensor-parallelism,2143,1225,3368,66.318464,False,0.0,grok-code-fast-1,torch-tensor-parallelism,66.318464,False,0.0,False,66.318464 +b85e18c9-f2b9-4a47-a3b9-b3f50ae506ff,gpt-5,openai,hf-model-inference,7134,3000,10134,643.153518,True,1.0,gpt-5,hf-model-inference,643.153518,True,1.0,True,643.153518 +539e5175-7ae0-4359-b135-698e97ce318b,grok-code-fast-1,xai,nginx-request-logging,3664,1550,5214,195.755936,False,0.0,grok-code-fast-1,nginx-request-logging,195.755936,False,0.0,False,195.755936 +e58c2f42-5754-4b2b-8790-18fca6a2c789,gpt-5-nano,openai,run-pdp11-code,9345,7164,16509,1004.027911,False,0.0,gpt-5-nano,run-pdp11-code,1004.027911,False,0.0,False,1004.027911 +e3cfd3b3-4453-46a4-836c-d8bdec71a9ff,claude-sonnet-4-20250514,anthropic,dna-assembly,18194,13181,31375,777.460307,False,0.0,claude-sonnet-4-20250514,dna-assembly,777.460307,False,0.0,False,777.460307 
+b7ceec9f-a5d7-4d8a-8e72-389a7b6f57d5,gemini-2.5-pro,gemini,reshard-c4-data,8164,4104,12268,274.800057,False,0.0,gemini-2.5-pro,reshard-c4-data,274.800057,False,0.0,False,274.800057 +7ccb38d2-3176-48cf-a5c1-9bef862ba465,grok-4-0709,xai,video-processing,16332,9152,25484,1404.157416,False,0.0,grok-4-0709,video-processing,1404.157416,False,0.0,False,1404.157416 +6938d6ee-21ab-4e2c-ab37-99a16aee4b9c,claude-sonnet-4-20250514,anthropic,bn-fit-modify,13098,5983,19081,529.07358,True,1.0,claude-sonnet-4-20250514,bn-fit-modify,529.07358,True,0.8,True,529.07358 +83274880-deb9-49e4-b1b1-bae3269b994c,claude-opus-4-1-20250805,anthropic,configure-git-webserver,6234,1889,8123,523.431272,False,0.0,claude-opus-4-1-20250805,configure-git-webserver,523.431272,False,0.625,False,523.431272 +b9ba8ec3-16f3-4aba-b771-f0c5ac5b894c,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-cython-ext,15047,3172,18219,593.283873,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-cython-ext,593.283873,False,0.0,False,593.283873 +0e3bf38e-4a77-4be3-b2d5-004f8b27145b,moonshotai/Kimi-K2-Instruct-0905,together_ai,code-from-image,10597,3542,14139,278.236347,True,1.0,moonshotai/Kimi-K2-Instruct-0905,code-from-image,278.236347,True,0.6,True,278.236347 +4737bd65-f497-4f4f-9586-e30c92d25d55,gemini-2.5-flash,gemini,cancel-async-tasks,1530,1776,3306,111.386539,True,1.0,gemini-2.5-flash,cancel-async-tasks,111.386539,True,0.2,True,111.386539 +9b40c39e-991f-4f66-b788-45ec57a002a8,zai-org/GLM-4.5-Air-FP8,together_ai,mteb-leaderboard,31124,12441,43565,1394.095312,False,0.0,zai-org/GLM-4.5-Air-FP8,mteb-leaderboard,1394.095312,False,0.0,False,1394.095312 +0497da47-e286-4ad6-b580-4c2aaf40463c,grok-4-0709,xai,port-compressor,8229,8558,16787,3610.970821,False,0.0,grok-4-0709,port-compressor,3610.970821,False,0.0,False,3610.970821 
+fdefef4c-9e51-480e-82d9-33cdf28d806b,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,circuit-fibsqrt,23156,20393,43549,3602.424125,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,circuit-fibsqrt,3602.424125,False,0.0,False,3602.424125 +c201cda0-1d24-47f2-a9f9-80f79aadf5d6,moonshotai/Kimi-K2-Instruct-0905,together_ai,filter-js-from-html,6451,6696,13147,775.028371,False,0.0,moonshotai/Kimi-K2-Instruct-0905,filter-js-from-html,775.028371,False,0.0,False,775.028371 +7f1cc64b-59f1-4690-bd6f-3110aface092,claude-opus-4-1-20250805,anthropic,install-klee-minimal,20947,2291,23238,900.001134,False,0.0,claude-opus-4-1-20250805,install-klee-minimal,900.001134,False,0.0,False,900.001134 +916bc4b9-9649-495e-9f85-0f81271cf830,moonshotai/Kimi-K2-Instruct-0905,together_ai,fix-code-vulnerability,12737,7105,19842,900.037763,False,0.0,moonshotai/Kimi-K2-Instruct-0905,fix-code-vulnerability,900.037763,False,0.0,False,900.037763 +ed62e705-c932-4025-88d1-62b3c072d761,gpt-5-nano,openai,fix-ocaml-gc,18846,10558,29404,3636.301606,False,0.0,gpt-5-nano,fix-ocaml-gc,3636.301606,False,0.0,False,3636.301606 +5de0f073-202b-4bb1-81a2-d2922e1f60ab,gemini-2.5-flash,gemini,build-pmars,10574,19961,30535,907.796197,False,0.0,gemini-2.5-flash,build-pmars,907.796197,False,0.8,False,907.796197 +5f4d3c93-9c43-44ed-9570-06627b7467be,grok-4-0709,xai,code-from-image,5830,3872,9702,1200.001493,False,0.0,grok-4-0709,code-from-image,1200.001493,False,0.0,False,1200.001493 +ba414c4f-042f-4d73-ba2a-c4bc05eee3c8,grok-4-0709,xai,write-compressor,1438,545,1983,934.074333,False,0.0,grok-4-0709,write-compressor,934.074333,False,0.0,False,934.074333 +909acbce-5d68-428e-978b-09e519930c8c,openai/gpt-oss-120b,together_ai,log-summary-date-ranges,3216,2627,5843,91.054566,False,0.0,openai/gpt-oss-120b,log-summary-date-ranges,91.054566,False,0.0,False,91.054566 
+3daed4e6-68fc-45d1-a338-c8a13c8c0aff,claude-opus-4-1-20250805,anthropic,large-scale-text-editing,4513,4712,9225,1526.991126,True,1.0,claude-opus-4-1-20250805,large-scale-text-editing,1526.991126,True,0.6666666666666666,True,1526.991126 +74f9a8c6-854a-44a0-8c29-7611d07b3080,gpt-5,openai,configure-git-webserver,5524,1948,7472,584.741749,True,1.0,gpt-5,configure-git-webserver,584.741749,True,1.0,True,584.741749 +4ae56090-760a-4635-9528-d708a6624d2e,OpenAI/gpt-oss-20B,together_ai,db-wal-recovery,518,1595,2113,59.896131,False,0.0,OpenAI/gpt-oss-20B,db-wal-recovery,59.896131,False,0.0,False,59.896131 +7c9c2355-4935-4171-addf-d64d8b29ba6a,gpt-5-nano,openai,qemu-alpine-ssh,778,653,1431,958.775217,False,0.0,gpt-5-nano,qemu-alpine-ssh,958.775217,False,0.0,False,958.775217 +637d8a51-12b1-459a-8196-064f13a4e75b,claude-opus-4-1-20250805,anthropic,vulnerable-secret,6014,6599,12613,614.719795,True,1.0,claude-opus-4-1-20250805,vulnerable-secret,614.719795,True,0.625,True,614.719795 +7176447e-59c1-4860-96a9-d5da2c401656,claude-opus-4-1-20250805,anthropic,crack-7z-hash,15273,6708,21981,604.683938,True,1.0,claude-opus-4-1-20250805,crack-7z-hash,604.683938,True,0.8888888888888888,True,604.683938 +7aa3cb3a-60fc-4cf0-bcd2-b47eb8c01aa0,moonshotai/Kimi-K2-Instruct-0905,together_ai,bn-fit-modify,17999,9125,27124,1260.241971,False,0.0,moonshotai/Kimi-K2-Instruct-0905,bn-fit-modify,1260.241971,False,0.0,False,1260.241971 +feaebab0-3b67-47b9-93e9-28033d7cec5f,gemini-2.5-pro,gemini,reshard-c4-data,4515,3068,7583,242.309009,False,0.0,gemini-2.5-pro,reshard-c4-data,242.309009,False,0.0,False,242.309009 +20a6a7f0-0098-4f8b-98f3-0e0fffb04342,zai-org/GLM-4.5-Air-FP8,together_ai,cobol-modernization,11851,11533,23384,902.880442,True,1.0,zai-org/GLM-4.5-Air-FP8,cobol-modernization,902.880442,True,0.4,True,902.880442 
+49309084-4303-4efd-9374-e2cf38fddc89,openai/gpt-oss-120b,together_ai,feal-differential-cryptanalysis,2334,1288,3622,273.113123,False,0.0,openai/gpt-oss-120b,feal-differential-cryptanalysis,273.113123,False,0.0,False,273.113123 +c858668d-b216-41b7-8947-f09500bf25f7,gpt-5-mini,openai,wasm-pipeline,1929,1923,3852,140.835801,False,0.0,gpt-5-mini,wasm-pipeline,140.835801,False,0.6,False,140.835801 +243dff01-b3ef-4e14-8257-b3be2f483061,grok-4-0709,xai,openssl-selfsigned-cert,1916,1192,3108,183.724676,False,0.0,grok-4-0709,openssl-selfsigned-cert,183.724676,False,0.0,False,183.724676 +8f2413db-2f65-4407-a2db-9778a2a2abe5,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,reverse-engineering,20875,12401,33276,1807.866536,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,reverse-engineering,1807.866536,False,0.0,False,1807.866536 +22d89426-a089-451a-af11-74b7b3807e91,zai-org/GLM-4.5-Air-FP8,together_ai,crack-7z-hash,16363,6670,23033,900.99169,False,0.0,zai-org/GLM-4.5-Air-FP8,crack-7z-hash,900.99169,False,0.0,False,900.99169 +9f350085-b024-4dc9-879e-d1de26480524,grok-code-fast-1,xai,sanitize-git-repo,4153,3120,7273,277.016566,False,0.0,grok-code-fast-1,sanitize-git-repo,277.016566,False,0.0,False,277.016566 +0e3d4a47-9082-4c27-b3f3-9129eaae9cdf,zai-org/GLM-4.5-Air-FP8,together_ai,filter-js-from-html,1577,1413,2990,35.26487,False,0.0,zai-org/GLM-4.5-Air-FP8,filter-js-from-html,35.26487,False,0.0,False,35.26487 +a1956742-d1f4-4666-a5a0-000704d5d205,deepseek-ai/DeepSeek-V3.1,together_ai,largest-eigenval,4405,3054,7459,815.661122,True,1.0,deepseek-ai/DeepSeek-V3.1,largest-eigenval,815.661122,True,0.2,True,815.661122 +8ea03f3f-2acc-4739-be0e-f4d728b16fdd,gemini-2.5-flash,gemini,sparql-university,2221,1326,3547,415.639648,False,0.0,gemini-2.5-flash,sparql-university,415.639648,False,0.0,False,415.639648 
+f3a3ad4b-e2cb-40a7-ae48-f7108907aa2d,gpt-5-nano,openai,make-mips-interpreter,73310,18897,92207,1807.654461,False,0.0,gpt-5-nano,make-mips-interpreter,1807.654461,False,0.0,False,1807.654461 +deea11ee-e07b-48aa-9b4d-332fc6a95b5d,claude-opus-4-1-20250805,anthropic,form-filling,9847,7880,17727,647.561332,True,1.0,claude-opus-4-1-20250805,form-filling,647.561332,True,1.0,True,647.561332 +a55e2ca9-c471-412f-8960-74314bec3eb8,deepseek-ai/DeepSeek-V3.1,together_ai,merge-diff-arc-agi-task,9582,3352,12934,936.71914,False,0.0,deepseek-ai/DeepSeek-V3.1,merge-diff-arc-agi-task,936.71914,False,0.2,False,936.71914 +ac37274f-8aa4-4e32-b192-db89f2d4fced,deepseek-ai/DeepSeek-V3.1,together_ai,feal-linear-cryptanalysis,32156,28032,60188,1820.259437,False,0.0,deepseek-ai/DeepSeek-V3.1,feal-linear-cryptanalysis,1820.259437,False,0.0,False,1820.259437 +3eff1b3a-3c93-4a74-b83e-1818ba20c3c1,gpt-5,openai,build-cython-ext,6667,2979,9646,953.928777,False,0.0,gpt-5,build-cython-ext,953.928777,False,0.0,False,953.928777 +d21f18be-2a96-4b09-9d50-f83c158dc120,zai-org/GLM-4.5-Air-FP8,together_ai,fix-ocaml-gc,35775,13797,49572,3702.752326,False,0.0,zai-org/GLM-4.5-Air-FP8,fix-ocaml-gc,3702.752326,False,0.0,False,3702.752326 +05238921-61a2-4282-abb4-9204bb623204,gpt-5-mini,openai,constraints-scheduling,4483,4136,8619,257.038028,False,0.0,gpt-5-mini,constraints-scheduling,257.038028,False,0.8,False,257.038028 +be90131b-91f0-4804-98ca-13cd5b1f869e,grok-code-fast-1,xai,fix-code-vulnerability,5359,3486,8845,367.197265,False,0.0,grok-code-fast-1,fix-code-vulnerability,367.197265,False,0.0,False,367.197265 +c8918de4-af8f-42c7-b859-7f6048451477,gpt-5,openai,crack-7z-hash,758,619,1377,56.775652,False,0.0,gpt-5,crack-7z-hash,56.775652,False,0.4285714285714285,False,56.775652 +446ab231-38c5-474f-b4d7-c15d25f82b6b,gpt-5,openai,qemu-startup,3343,2643,5986,553.60153,True,1.0,gpt-5,qemu-startup,553.60153,True,0.8,True,553.60153 
+cf660706-c250-4052-ac98-15acccba673f,claude-opus-4-1-20250805,anthropic,wasm-pipeline,4545,2705,7250,319.873497,False,0.0,claude-opus-4-1-20250805,wasm-pipeline,319.873497,False,0.1428571428571428,False,319.873497 +a53dc8c4-095f-417a-9cc0-01167b96fe1d,openai/gpt-oss-120b,together_ai,build-initramfs-qemu,1542,1935,3477,192.336938,False,0.0,openai/gpt-oss-120b,build-initramfs-qemu,192.336938,False,0.0,False,192.336938 +f7ddca7a-26e0-497c-acd3-929095841245,gpt-5,openai,feal-linear-cryptanalysis,15072,5514,20586,887.480821,True,1.0,gpt-5,feal-linear-cryptanalysis,887.480821,True,1.0,True,887.480821 +d1881caf-a6bf-4f24-b6d6-92e4701c9f2d,gpt-5-mini,openai,tune-mjcf,8863,7416,16279,908.167712,False,0.0,gpt-5-mini,tune-mjcf,908.167712,False,0.0,False,908.167712 +41ec1529-01ef-41f5-b5e3-041fdb80059b,claude-opus-4-1-20250805,anthropic,sqlite-db-truncate,9930,7594,17524,486.648373,False,0.0,claude-opus-4-1-20250805,sqlite-db-truncate,486.648373,False,0.125,False,486.648373 +b48e2287-c476-4880-84df-705e261f2f9c,moonshotai/Kimi-K2-Instruct-0905,together_ai,openssl-selfsigned-cert,5504,5146,10650,267.589208,True,1.0,moonshotai/Kimi-K2-Instruct-0905,openssl-selfsigned-cert,267.589208,True,0.6,True,267.589208 +9e72a9be-9370-43c2-8806-ec0d8b681445,claude-opus-4-1-20250805,anthropic,build-initramfs-qemu,1558,1095,2653,941.034192,False,0.0,claude-opus-4-1-20250805,build-initramfs-qemu,941.034192,False,0.0,False,941.034192 +7dd0188d-e6b7-47ac-9e2f-9d2724e89ec7,gemini-2.5-pro,gemini,torch-tensor-parallelism,1800,1268,3068,154.811466,False,0.0,gemini-2.5-pro,torch-tensor-parallelism,154.811466,False,0.0,False,154.811466 +0f43cb55-2c61-45db-9b04-ad48d68f5781,claude-sonnet-4-20250514,anthropic,port-compressor,64591,39159,103750,3617.737665,False,0.0,claude-sonnet-4-20250514,port-compressor,3617.737665,False,0.2,False,3617.737665 
+05fa808b-69c8-425a-ac10-7256f8915134,OpenAI/gpt-oss-20B,together_ai,schemelike-metacircular-eval,236,371,607,41.529751,False,0.0,OpenAI/gpt-oss-20B,schemelike-metacircular-eval,41.529751,False,0.0,False,41.529751 +ef1f5c77-2c51-43d9-8967-865f54feabfb,grok-code-fast-1,xai,regex-log,1287,578,1865,54.823073,False,0.0,grok-code-fast-1,regex-log,54.823073,False,0.0,False,54.823073 +3acfc990-885b-473e-a139-e3d42adb6c5a,gemini-2.5-flash,gemini,break-filter-js-from-html,1902,1284,3186,135.464199,False,0.0,gemini-2.5-flash,break-filter-js-from-html,135.464199,False,0.0,False,135.464199 +a8be5d3c-96d8-4a69-a1a5-830ba102fa74,claude-opus-4-1-20250805,anthropic,extract-elf,8126,2996,11122,158.103233,True,1.0,claude-opus-4-1-20250805,extract-elf,158.103233,True,0.8888888888888888,True,158.103233 +423786cc-527b-4470-9401-4ea11ad5623e,gpt-5,openai,polyglot-rust-c,857,1038,1895,900.436422,False,0.0,gpt-5,polyglot-rust-c,900.436422,False,0.0,False,900.436422 +f66e6d5b-d883-4258-927e-630c67613403,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,extract-elf,24312,6705,31017,598.281313,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,extract-elf,598.281313,True,0.6,True,598.281313 +0024b61a-5730-447a-b355-529ac5632ea4,grok-4-0709,xai,password-recovery,6314,1982,8296,900.413332,False,0.0,grok-4-0709,password-recovery,900.413332,False,0.0,False,900.413332 +9c414b15-610b-41f7-bc57-909a6025a9eb,grok-code-fast-1,xai,mteb-leaderboard,1064,804,1868,89.786656,False,0.0,grok-code-fast-1,mteb-leaderboard,89.786656,False,0.0,False,89.786656 +760efc82-9101-4a26-9df3-e87cc0103cb3,gpt-5,openai,vulnerable-secret,4918,3742,8660,417.905626,True,1.0,gpt-5,vulnerable-secret,417.905626,True,0.2857142857142857,True,417.905626 +8e6d32d4-c45c-4db4-a123-4685dbe95f97,openai/gpt-oss-120b,together_ai,sparql-university,2005,2059,4064,92.636642,False,0.0,openai/gpt-oss-120b,sparql-university,92.636642,False,0.0,False,92.636642 
+803364a1-8a6d-405a-b9c5-09b8adb8bcce,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sqlite-with-gcov,10810,2309,13119,464.546568,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sqlite-with-gcov,464.546568,False,0.6,False,464.546568 +aa1d1daa-08fb-4f85-929d-ce91ed1ef9ab,claude-sonnet-4-20250514,anthropic,regex-log,4910,4335,9245,486.005807,True,1.0,claude-sonnet-4-20250514,regex-log,486.005807,True,0.8,True,486.005807 +b52b4b85-cbb6-409e-a3c6-ad272651857e,grok-code-fast-1,xai,sqlite-with-gcov,4714,1225,5939,529.545409,False,0.0,grok-code-fast-1,sqlite-with-gcov,529.545409,False,0.2,False,529.545409 +4d6deb71-731d-4035-9dd3-f06cc813c1dc,zai-org/GLM-4.5-Air-FP8,together_ai,install-klee-minimal,13997,2913,16910,908.189576,False,0.0,zai-org/GLM-4.5-Air-FP8,install-klee-minimal,908.189576,False,0.0,False,908.189576 +34deb58a-e735-4c87-b523-c955da1913ae,grok-4-0709,xai,reshard-c4-data,5039,3439,8478,1685.104608,False,0.0,grok-4-0709,reshard-c4-data,1685.104608,False,0.0,False,1685.104608 +5780953a-ea1a-49eb-b8d6-84f7b1053b33,gpt-5-mini,openai,gpt2-codegolf,1631,1448,3079,177.836258,False,0.0,gpt-5-mini,gpt2-codegolf,177.836258,False,0.0,False,177.836258 +d7511421-da50-4bbe-a619-5586b20bea5a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,gpt2-codegolf,3425,2772,6197,170.261898,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,gpt2-codegolf,170.261898,False,0.0,False,170.261898 +bb4e93a3-bf83-4472-90e6-036592476b29,gpt-5-mini,openai,form-filling,9713,8850,18563,374.630614,True,1.0,gpt-5-mini,form-filling,374.630614,True,1.0,True,374.630614 +f9a3195f-91b9-479e-a27b-f2f1c8a8fdc5,zai-org/GLM-4.5-Air-FP8,together_ai,hf-model-inference,15226,7468,22694,1993.84101,False,0.0,zai-org/GLM-4.5-Air-FP8,hf-model-inference,1993.84101,False,0.8,False,1993.84101 
+11670a27-f9ea-4496-9c8c-4b9e04cdc3cb,moonshotai/Kimi-K2-Instruct-0905,together_ai,git-leak-recovery,3088,2740,5828,920.543412,True,1.0,moonshotai/Kimi-K2-Instruct-0905,git-leak-recovery,920.543412,True,1.0,True,920.543412 +9de5fd51-5c7a-4efc-8234-a953a18d7dd7,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,code-from-image,959,438,1397,282.879055,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,code-from-image,282.879055,False,0.4,False,282.879055 +e60f5092-6053-406e-9736-379d4abdc560,grok-4-0709,xai,torch-tensor-parallelism,2052,2250,4302,653.851522,False,0.0,grok-4-0709,torch-tensor-parallelism,653.851522,False,0.0,False,653.851522 +27f34435-87e4-4aae-85a4-1b12f7a2ffe6,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,merge-diff-arc-agi-task,6649,2170,8819,149.666435,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,merge-diff-arc-agi-task,149.666435,False,0.0,False,149.666435 +bc697001-3346-435b-b3c6-8f11bd9ae00f,claude-sonnet-4-20250514,anthropic,make-mips-interpreter,22675,13462,36137,1432.885008,False,0.0,claude-sonnet-4-20250514,make-mips-interpreter,1432.885008,False,0.0,False,1432.885008 +cdf58378-9ea2-4597-960e-503d786bcdc4,gemini-2.5-pro,gemini,dna-insert,1124,393,1517,374.329582,False,0.0,gemini-2.5-pro,dna-insert,374.329582,False,0.0,False,374.329582 +6d63f1db-5ca1-4953-9266-8b6691cd2530,OpenAI/gpt-oss-20B,together_ai,regex-log,346,833,1179,102.965557,False,0.0,OpenAI/gpt-oss-20B,regex-log,102.965557,False,0.0,False,102.965557 +ba379ce3-ad2f-47ae-94b7-890311dd4d7f,openai/gpt-oss-120b,together_ai,reverse-engineering,10007,7549,17556,1802.649992,False,0.0,openai/gpt-oss-120b,reverse-engineering,1802.649992,False,0.2,False,1802.649992 +042e788b-5cbb-44b0-bbbd-de0b43132101,claude-opus-4-1-20250805,anthropic,qemu-alpine-ssh,1329,856,2185,1009.953127,False,0.0,claude-opus-4-1-20250805,qemu-alpine-ssh,1009.953127,False,0.8571428571428571,False,1009.953127 
+945b7dc1-8899-406b-b648-4cb0c9e6337e,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,git-leak-recovery,3496,2056,5552,193.680403,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,git-leak-recovery,193.680403,True,1.0,True,193.680403 +1ee83146-5264-419a-8ef7-4596ef601e8e,grok-4-0709,xai,nginx-request-logging,4096,1621,5717,559.380688,True,1.0,grok-4-0709,nginx-request-logging,559.380688,True,1.0,True,559.380688 +97ea7eeb-c160-494b-a119-817c375eb442,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,count-dataset-tokens,8860,1621,10481,932.418981,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,count-dataset-tokens,932.418981,False,0.0,False,932.418981 +6da7bac5-6b1f-4459-915d-ce0e98535ed0,zai-org/GLM-4.5-Air-FP8,together_ai,dna-insert,13777,3342,17119,360.083575,False,0.0,zai-org/GLM-4.5-Air-FP8,dna-insert,360.083575,False,0.0,False,360.083575 +f871f347-cd99-4582-a001-5031520a1252,claude-opus-4-1-20250805,anthropic,install-klee-minimal,8762,1570,10332,900.78486,False,0.0,claude-opus-4-1-20250805,install-klee-minimal,900.78486,False,0.0,False,900.78486 +2bc50ca6-a16a-4228-96e3-72dd4e94cd93,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-pmars,8361,3141,11502,305.964842,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-pmars,305.964842,False,0.2,False,305.964842 +7ba63556-9ba8-4932-95ac-296dce71b609,gemini-2.5-flash,gemini,filter-js-from-html,11107,6448,17555,900.016529,False,0.0,gemini-2.5-flash,filter-js-from-html,900.016529,False,0.0,False,900.016529 +1aad6804-be75-4542-9fbc-79d5a89b6ab3,gpt-5,openai,pytorch-model-cli,8404,7491,15895,266.112916,False,0.0,gpt-5,pytorch-model-cli,266.112916,False,0.0,False,266.112916 +6f27a6ea-6f12-4bd8-bcac-196bf6b46c42,openai/gpt-oss-120b,together_ai,fix-code-vulnerability,7093,2961,10054,79.437651,False,0.0,openai/gpt-oss-120b,fix-code-vulnerability,79.437651,False,0.0,False,79.437651 
+08729cc1-bb32-450c-bc9d-3d1ca07c44a8,moonshotai/Kimi-K2-Instruct-0905,together_ai,install-windows-3.11,7223,3407,10630,249.859577,False,0.0,moonshotai/Kimi-K2-Instruct-0905,install-windows-3.11,249.859577,False,0.0,False,249.859577 +654b66e5-8da8-45d6-ae8c-2861742a24cb,gpt-5,openai,regex-log,2008,1739,3747,247.217786,True,1.0,gpt-5,regex-log,247.217786,True,1.0,True,247.217786 +d985b6b2-99b4-436b-9282-e633c1439311,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sqlite-db-truncate,14698,13236,27934,912.580101,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sqlite-db-truncate,912.580101,False,0.0,False,912.580101 +e2012e6c-2fcd-433e-8557-7618b9517708,moonshotai/Kimi-K2-Instruct-0905,together_ai,largest-eigenval,7616,5725,13341,541.384516,True,1.0,moonshotai/Kimi-K2-Instruct-0905,largest-eigenval,541.384516,True,0.2,True,541.384516 +3010fdc0-0b0a-44c3-9a14-b853a4b54786,grok-code-fast-1,xai,train-fasttext,10261,3282,13543,864.854779,False,0.0,grok-code-fast-1,train-fasttext,864.854779,False,0.0,False,864.854779 +4ea250c0-8e1e-461c-a791-9a56a095bedb,gpt-5-nano,openai,bn-fit-modify,5231,5313,10544,479.923244,False,0.0,gpt-5-nano,bn-fit-modify,479.923244,False,0.0,False,479.923244 +79d64d86-3e7c-4aa5-a892-32a78b9328f2,gpt-5-mini,openai,chess-best-move,19767,14992,34759,902.766475,False,0.0,gpt-5-mini,chess-best-move,902.766475,False,0.0,False,902.766475 +38efde58-2307-4391-a382-738774025928,gemini-2.5-flash,gemini,port-compressor,27060,26435,53495,3600.753661,False,0.0,gemini-2.5-flash,port-compressor,3600.753661,False,0.0,False,3600.753661 +76320ab6-3367-459c-9433-ebdf7a882529,gemini-2.5-pro,gemini,fix-code-vulnerability,7451,3443,10894,574.522182,False,0.0,gemini-2.5-pro,fix-code-vulnerability,574.522182,False,0.2,False,574.522182 +4f9ed2f7-68ac-4fb6-870e-92fb9a0b232f,claude-sonnet-4-20250514,anthropic,cobol-modernization,7522,6501,14023,421.664031,True,1.0,claude-sonnet-4-20250514,cobol-modernization,421.664031,True,1.0,True,421.664031 
+79be448e-3684-4991-be44-cc2de2616429,gpt-5,openai,wasm-pipeline,5880,5291,11171,408.366168,True,1.0,gpt-5,wasm-pipeline,408.366168,True,1.0,True,408.366168 +f20d455e-6091-4875-bca0-54a50c72d59c,grok-4-0709,xai,db-wal-recovery,1673,2421,4094,909.460891,False,0.0,grok-4-0709,db-wal-recovery,909.460891,False,0.2,False,909.460891 +eec49838-b1f3-4eb6-b24b-b41872c08fa7,openai/gpt-oss-120b,together_ai,log-summary-date-ranges,1589,933,2522,65.117263,False,0.0,openai/gpt-oss-120b,log-summary-date-ranges,65.117263,False,0.0,False,65.117263 +84edd2dc-c29d-4987-b092-a7702cd0a6db,claude-sonnet-4-20250514,anthropic,configure-git-webserver,6754,2419,9173,869.832717,False,0.0,claude-sonnet-4-20250514,configure-git-webserver,869.832717,False,0.6,False,869.832717 +eef21312-014e-480f-9a90-aee2d4bb6178,claude-opus-4-1-20250805,anthropic,dna-insert,5041,2206,7247,360.748988,False,0.0,claude-opus-4-1-20250805,dna-insert,360.748988,False,0.0,False,360.748988 +e3e8a5dc-d931-446a-b5f8-95798559528e,openai/gpt-oss-120b,together_ai,form-filling,4639,4496,9135,132.03676,True,1.0,openai/gpt-oss-120b,form-filling,132.03676,True,0.6,True,132.03676 +b1fbb71f-78b9-4d03-9cc2-b15ecd62fba8,grok-4-0709,xai,largest-eigenval,2563,1527,4090,962.51849,False,0.0,grok-4-0709,largest-eigenval,962.51849,False,0.0,False,962.51849 +4aac4a6e-83bd-4671-89b1-466635dea80b,gemini-2.5-flash,gemini,sanitize-git-repo,11483,2768,14251,440.454082,False,0.0,gemini-2.5-flash,sanitize-git-repo,440.454082,False,0.0,False,440.454082 +1612d9f0-2390-4305-a058-641caf92a327,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,polyglot-rust-c,8481,6095,14576,314.795301,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,polyglot-rust-c,314.795301,False,0.0,False,314.795301 +1400e1a7-4021-4e2b-985f-1733042c1165,openai/gpt-oss-120b,together_ai,write-compressor,7310,7404,14714,826.793061,False,0.0,openai/gpt-oss-120b,write-compressor,826.793061,False,0.0,False,826.793061 
+8b5c92dd-4b5c-40db-86a0-7f930db8c8c5,grok-code-fast-1,xai,cobol-modernization,4489,2425,6914,403.320067,True,1.0,grok-code-fast-1,cobol-modernization,403.320067,True,0.6,True,403.320067 +10e99df9-b28c-4791-85ff-8f9bc2e8cef6,OpenAI/gpt-oss-20B,together_ai,regex-log,1491,1077,2568,73.828295,False,0.0,OpenAI/gpt-oss-20B,regex-log,73.828295,False,0.0,False,73.828295 +fa7ff783-1934-4c01-9b1c-89f429100981,grok-4-0709,xai,sanitize-git-repo,4911,1429,6340,458.522079,False,0.0,grok-4-0709,sanitize-git-repo,458.522079,False,0.0,False,458.522079 +feac42a9-c1b0-4606-a946-91a8c1903182,gpt-5,openai,path-tracing-reverse,7473,3784,11257,733.933442,False,0.0,gpt-5,path-tracing-reverse,733.933442,False,0.0,False,733.933442 +63248a7f-4a6c-4896-a9e5-7a7478ad32a9,grok-code-fast-1,xai,pypi-server,3155,1593,4748,118.283497,True,1.0,grok-code-fast-1,pypi-server,118.283497,True,0.8,True,118.283497 +60a2ba2a-a896-44a3-ae5c-297d8c437384,grok-code-fast-1,xai,model-extraction-relu-logits,2088,772,2860,89.033644,False,0.0,grok-code-fast-1,model-extraction-relu-logits,89.033644,False,0.0,False,89.033644 +07ebf929-fb6b-4afd-a2f2-833e7dcedc67,grok-4-0709,xai,fix-code-vulnerability,8384,4106,12490,912.346991,False,0.0,grok-4-0709,fix-code-vulnerability,912.346991,False,0.2,False,912.346991 +6f88e697-5e8b-4aa2-b1d6-a977771d3126,grok-code-fast-1,xai,run-pdp11-code,1937,1737,3674,210.61015,False,0.0,grok-code-fast-1,run-pdp11-code,210.61015,False,0.0,False,210.61015 +451e5156-cf86-4745-b6eb-fbaae22e6a02,zai-org/GLM-4.5-Air-FP8,together_ai,constraints-scheduling,17964,15314,33278,577.996644,True,1.0,zai-org/GLM-4.5-Air-FP8,constraints-scheduling,577.996644,True,0.8,True,577.996644 +5ad4e3f0-a931-423e-bfec-3ecc95d8d189,claude-opus-4-1-20250805,anthropic,crack-7z-hash,11715,4048,15763,386.362799,True,1.0,claude-opus-4-1-20250805,crack-7z-hash,386.362799,True,0.8888888888888888,True,386.362799 
+6509474a-58f9-4e6e-8606-432b533503e4,grok-code-fast-1,xai,distribution-search,3726,2679,6405,366.596882,False,0.0,grok-code-fast-1,distribution-search,366.596882,False,0.0,False,366.596882 +a65031e2-fd31-498a-ad92-9fb2a73ed322,gpt-5,openai,pypi-server,3849,1561,5410,280.939756,False,0.0,gpt-5,pypi-server,280.939756,False,0.3333333333333333,False,280.939756 +128bf28d-0794-4e84-8142-32f5736c5329,claude-opus-4-1-20250805,anthropic,constraints-scheduling,5630,3649,9279,154.718894,True,1.0,claude-opus-4-1-20250805,constraints-scheduling,154.718894,True,0.8888888888888888,True,154.718894 +06feebb8-4f28-4655-be1a-680275f1ab76,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-cython-ext,17013,5001,22014,903.694718,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-cython-ext,903.694718,False,0.0,False,903.694718 +b9cdca01-ed4d-4c34-91bb-2f20c1f67517,deepseek-ai/DeepSeek-V3.1,together_ai,qemu-alpine-ssh,2225,5575,7800,902.799817,False,0.0,deepseek-ai/DeepSeek-V3.1,qemu-alpine-ssh,902.799817,False,0.2,False,902.799817 +fac83c01-9bc6-4848-9eb8-d837ac6bb292,claude-opus-4-1-20250805,anthropic,extract-elf,6823,4234,11057,372.45689,True,1.0,claude-opus-4-1-20250805,extract-elf,372.45689,True,0.8888888888888888,True,372.45689 +0a63537f-7450-4da3-84b4-89cf6044ca72,claude-sonnet-4-20250514,anthropic,wasm-pipeline,11870,6061,17931,835.237167,True,1.0,claude-sonnet-4-20250514,wasm-pipeline,835.237167,True,0.6,True,835.237167 +03860372-7808-4d99-8ea7-f58621da134b,openai/gpt-oss-120b,together_ai,build-pmars,10717,7150,17867,775.80269,True,1.0,openai/gpt-oss-120b,build-pmars,775.80269,True,0.2,True,775.80269 +c2e7a50c-ca6c-4f41-8c44-8e27cb13b82c,zai-org/GLM-4.5-Air-FP8,together_ai,tune-mjcf,10902,8712,19614,908.918819,False,0.0,zai-org/GLM-4.5-Air-FP8,tune-mjcf,908.918819,False,0.0,False,908.918819 
+63fba954-9d7d-4241-a98c-56f5d5b65ca6,claude-opus-4-1-20250805,anthropic,largest-eigenval,17703,10800,28503,900.000739,False,0.0,claude-opus-4-1-20250805,largest-eigenval,900.000739,False,0.25,False,900.000739 +e87a402f-bf18-4b9c-96b8-3bf64a5f936d,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,make-doom-for-mips,12327,3860,16187,908.157591,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,make-doom-for-mips,908.157591,False,0.0,False,908.157591 +7ad798f8-fb44-4af6-bd6d-e7d87a048706,zai-org/GLM-4.5-Air-FP8,together_ai,video-processing,6907,6995,13902,273.544293,False,0.0,zai-org/GLM-4.5-Air-FP8,video-processing,273.544293,False,0.0,False,273.544293 +ad31bfcb-f729-46f9-993d-82cad9da3d46,grok-4-0709,xai,make-mips-interpreter,13527,19873,33400,1801.307985,False,0.0,grok-4-0709,make-mips-interpreter,1801.307985,False,0.0,False,1801.307985 +5270ce53-3149-4a61-a036-9136d049bee3,grok-code-fast-1,xai,write-compressor,9292,6978,16270,587.516028,False,0.0,grok-code-fast-1,write-compressor,587.516028,False,0.0,False,587.516028 +3f5a6d24-6e1d-4bfa-9ebf-56952f550972,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,reverse-engineering,38331,15780,54111,1804.727068,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,reverse-engineering,1804.727068,False,0.0,False,1804.727068 +412f034e-057f-4601-a199-8905f6db9312,gpt-5,openai,winning-avg-corewars,24966,18878,43844,3608.612061,False,0.0,gpt-5,winning-avg-corewars,3608.612061,False,0.2857142857142857,False,3608.612061 +8891155c-f9c4-4757-a04c-60be19301407,grok-code-fast-1,xai,sqlite-with-gcov,5239,1196,6435,190.95286,False,0.0,grok-code-fast-1,sqlite-with-gcov,190.95286,False,0.2,False,190.95286 +41abb8d2-14f3-4af4-9feb-6cf4305f2d4c,OpenAI/gpt-oss-20B,together_ai,qemu-startup,1049,841,1890,510.358335,False,0.0,OpenAI/gpt-oss-20B,qemu-startup,510.358335,False,0.0,False,510.358335 
+a3ccf7a6-342a-4b03-999c-06f91aac4bcc,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-pov-ray,16096,5134,21230,1247.643931,True,1.0,moonshotai/Kimi-K2-Instruct-0905,build-pov-ray,1247.643931,True,1.0,True,1247.643931 +374c0fa7-66c5-4562-a639-ed253a56d108,moonshotai/Kimi-K2-Instruct-0905,together_ai,chess-best-move,8759,5892,14651,900.02618,False,0.0,moonshotai/Kimi-K2-Instruct-0905,chess-best-move,900.02618,False,0.0,False,900.02618 +6673573e-76a4-4470-bc75-21c73872264e,zai-org/GLM-4.5-Air-FP8,together_ai,financial-document-processor,8692,3943,12635,193.760596,False,0.0,zai-org/GLM-4.5-Air-FP8,financial-document-processor,193.760596,False,0.0,False,193.760596 +97ab00be-9882-466f-aa3b-b6dd87c118b4,grok-4-0709,xai,feal-differential-cryptanalysis,826,284,1110,1834.810201,False,0.0,grok-4-0709,feal-differential-cryptanalysis,1834.810201,False,0.8,False,1834.810201 +336786f3-44e9-4241-bb51-282b3bfca6c3,OpenAI/gpt-oss-20B,together_ai,fix-git,4352,1347,5699,256.074607,False,0.0,OpenAI/gpt-oss-20B,fix-git,256.074607,False,0.2,False,256.074607 +a8c719a9-8eeb-411a-b548-42c304ac9193,claude-opus-4-1-20250805,anthropic,fix-code-vulnerability,22560,8521,31081,900.000752,False,0.0,claude-opus-4-1-20250805,fix-code-vulnerability,900.000752,False,0.125,False,900.000752 +1e865dba-6639-4ba7-96ef-63d134946042,deepseek-ai/DeepSeek-V3.1,together_ai,hf-model-inference,7466,3085,10551,274.85526,False,0.0,deepseek-ai/DeepSeek-V3.1,hf-model-inference,274.85526,False,0.8,False,274.85526 +3fb70c5d-603d-4a56-9544-1fa6e86acb49,gemini-2.5-flash,gemini,circuit-fibsqrt,25644,85716,111360,3605.343807,False,0.0,gemini-2.5-flash,circuit-fibsqrt,3605.343807,False,0.0,False,3605.343807 +6f2286cb-37a3-427f-affa-a247a637b3f6,grok-code-fast-1,xai,break-filter-js-from-html,2321,1217,3538,149.44933,False,0.0,grok-code-fast-1,break-filter-js-from-html,149.44933,False,0.0,False,149.44933 
+f4ece6ec-71bb-4cab-9146-50ee0d232963,openai/gpt-oss-120b,together_ai,crack-7z-hash,10863,4602,15465,900.039488,False,0.0,openai/gpt-oss-120b,crack-7z-hash,900.039488,False,0.0,False,900.039488 +fea40e70-1131-4734-8163-f6de6762c5fb,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,chess-best-move,1332,1100,2432,348.395831,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,chess-best-move,348.395831,False,0.0,False,348.395831 +8e1ba374-b005-4253-9137-67c44aa77c4f,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,cobol-modernization,19776,11310,31086,793.406251,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,cobol-modernization,793.406251,False,0.0,False,793.406251 +e87af172-92a2-4816-bdc2-d2026892fa9c,gpt-5-mini,openai,regex-log,1690,1313,3003,105.204183,True,1.0,gpt-5-mini,regex-log,105.204183,True,0.8,True,105.204183 +b3927f65-cccc-4385-a034-1d87da8d901a,grok-4-0709,xai,crack-7z-hash,8038,2183,10221,402.887019,True,1.0,grok-4-0709,crack-7z-hash,402.887019,True,0.8,True,402.887019 +a46ecde0-6724-486e-8e17-9f9289e2bb08,claude-sonnet-4-20250514,anthropic,reverse-engineering,10694,11985,22679,1800.460828,False,0.0,claude-sonnet-4-20250514,reverse-engineering,1800.460828,False,0.0,False,1800.460828 +a5625fff-9862-41ac-a2a3-7f0420fce703,grok-code-fast-1,xai,regex-log,1408,746,2154,72.708507,False,0.0,grok-code-fast-1,regex-log,72.708507,False,0.0,False,72.708507 +a722efb7-642d-4194-9b04-050b6555a778,gpt-5-mini,openai,sqlite-db-truncate,6043,5416,11459,308.129346,False,0.0,gpt-5-mini,sqlite-db-truncate,308.129346,False,0.0,False,308.129346 +6b4fb7be-8759-4512-b17d-f08c0998233e,grok-4-0709,xai,make-mips-interpreter,25672,31014,56686,1802.716715,False,0.0,grok-4-0709,make-mips-interpreter,1802.716715,False,0.0,False,1802.716715 
+a89e3665-6b62-4a97-a605-9c0f676554a1,deepseek-ai/DeepSeek-V3.1,together_ai,sqlite-db-truncate,6151,3454,9605,248.433824,False,0.0,deepseek-ai/DeepSeek-V3.1,sqlite-db-truncate,248.433824,False,0.0,False,248.433824 +6333fe25-886b-45ac-983f-189d825d7f89,deepseek-ai/DeepSeek-V3.1,together_ai,qemu-alpine-ssh,5502,8493,13995,907.926095,True,1.0,deepseek-ai/DeepSeek-V3.1,qemu-alpine-ssh,907.926095,True,0.2,True,907.926095 +b208c1fc-7482-4ea2-a46d-a94992e639fc,gemini-2.5-pro,gemini,winning-avg-corewars,21284,28438,49722,3617.822027,False,0.0,gemini-2.5-pro,winning-avg-corewars,3617.822027,False,0.0,False,3617.822027 +9c21b970-70c9-4ed9-9225-3359366bc77c,claude-opus-4-1-20250805,anthropic,cancel-async-tasks,2650,2149,4799,70.458081,False,0.0,claude-opus-4-1-20250805,cancel-async-tasks,70.458081,False,0.125,False,70.458081 +b45fa4aa-8565-452f-ad00-4bdebde0cc0c,moonshotai/Kimi-K2-Instruct-0905,together_ai,merge-diff-arc-agi-task,20920,9792,30712,382.938725,False,0.0,moonshotai/Kimi-K2-Instruct-0905,merge-diff-arc-agi-task,382.938725,False,0.0,False,382.938725 +59caa329-bdb3-48ad-92e4-c817e42853d1,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,tune-mjcf,13358,8318,21676,534.280481,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,tune-mjcf,534.280481,False,0.0,False,534.280481 +0d33b75d-e4ab-45c6-8530-08016f44cf24,gpt-5-mini,openai,make-doom-for-mips,9654,9208,18862,915.411897,False,0.0,gpt-5-mini,make-doom-for-mips,915.411897,False,0.0,False,915.411897 +476eafbb-d551-42c7-8543-c1d791b4b995,gemini-2.5-pro,gemini,chess-best-move,7756,5912,13668,446.379789,False,0.0,gemini-2.5-pro,chess-best-move,446.379789,False,0.0,False,446.379789 +a9021d08-4108-4d4a-8ef0-541b67f3ea5d,grok-4-0709,xai,tune-mjcf,3213,2781,5994,907.29432,False,0.0,grok-4-0709,tune-mjcf,907.29432,False,0.0,False,907.29432 
+90e9c501-2db6-4538-9815-97fe7b2ce0ab,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,distribution-search,3043,2198,5241,305.537301,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,distribution-search,305.537301,False,0.0,False,305.537301 +b02e366d-413e-45ec-bff1-c5270d7568b5,grok-4-0709,xai,distribution-search,1793,1451,3244,1061.994976,False,0.0,grok-4-0709,distribution-search,1061.994976,False,0.4,False,1061.994976 +ac16808b-7371-4eb5-ab24-3359199c89ee,deepseek-ai/DeepSeek-V3.1,together_ai,make-mips-interpreter,27504,28765,56269,1174.320946,False,0.0,deepseek-ai/DeepSeek-V3.1,make-mips-interpreter,1174.320946,False,0.0,False,1174.320946 +ee3043c4-c0a3-497b-b665-6e7658461dc8,gpt-5-mini,openai,adaptive-rejection-sampler,6398,9071,15469,900.037299,False,0.0,gpt-5-mini,adaptive-rejection-sampler,900.037299,False,0.4,False,900.037299 +603b3cb5-35c7-4d2f-84c7-ead220ce665d,claude-sonnet-4-20250514,anthropic,install-windows-3.11,8094,3635,11729,281.134732,False,0.0,claude-sonnet-4-20250514,install-windows-3.11,281.134732,False,0.0,False,281.134732 +5fcb4894-caaa-4ee4-9135-30c95cdfa6a4,openai/gpt-oss-120b,together_ai,wasm-pipeline,10847,10301,21148,925.35537,False,0.0,openai/gpt-oss-120b,wasm-pipeline,925.35537,False,0.0,False,925.35537 +1b938b55-f019-4f28-a957-ca52037f1a7e,openai/gpt-oss-120b,together_ai,winning-avg-corewars,26345,23084,49429,1742.693082,True,1.0,openai/gpt-oss-120b,winning-avg-corewars,1742.693082,True,0.5,True,1742.693082 +0661b9b4-0109-4776-b308-0e28b6c83ada,claude-opus-4-1-20250805,anthropic,form-filling,7815,7210,15025,228.118926,True,1.0,claude-opus-4-1-20250805,form-filling,228.118926,True,1.0,True,228.118926 +8b53bdd3-248a-4f20-8fd1-511eedd6f448,claude-sonnet-4-20250514,anthropic,port-compressor,62662,34618,97280,3600.021671,False,0.0,claude-sonnet-4-20250514,port-compressor,3600.021671,False,0.2,False,3600.021671 
+64630eaf-d90e-4033-b7ad-7d2a0996e2c1,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,nginx-request-logging,5021,4010,9031,671.900416,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,nginx-request-logging,671.900416,False,0.0,False,671.900416 +23c9be1f-303c-4779-b2e0-2a989702f0fe,gemini-2.5-flash,gemini,financial-document-processor,8186,4272,12458,496.266184,False,0.0,gemini-2.5-flash,financial-document-processor,496.266184,False,0.0,False,496.266184 +00d6acb4-b0c3-4921-92a9-a79e3ae67325,gpt-5-nano,openai,cancel-async-tasks,4575,5687,10262,722.041626,True,1.0,gpt-5-nano,cancel-async-tasks,722.041626,True,0.4,True,722.041626 +bf5c5796-6487-42b9-884b-8f691ed9a429,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,db-wal-recovery,3323,3560,6883,174.403243,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,db-wal-recovery,174.403243,False,0.0,False,174.403243 +9fd4419d-332d-4803-ac2e-3b01bfff5a3f,OpenAI/gpt-oss-20B,together_ai,winning-avg-corewars,428,1601,2029,40.792568,False,0.0,OpenAI/gpt-oss-20B,winning-avg-corewars,40.792568,False,0.0,False,40.792568 +50549937-d8ca-423d-8be6-f4c5aef66fd9,gemini-2.5-flash,gemini,make-mips-interpreter,30422,80339,110761,1817.152785,False,0.0,gemini-2.5-flash,make-mips-interpreter,1817.152785,False,0.0,False,1817.152785 +7da5b938-c498-4939-8818-e00a125d6cdf,gpt-5-nano,openai,db-wal-recovery,5135,6100,11235,927.362762,False,0.0,gpt-5-nano,db-wal-recovery,927.362762,False,0.0,False,927.362762 +ccd9e1fa-a7ba-4fa0-aa1e-a71b76611493,gpt-5-nano,openai,port-compressor,15874,29889,45763,3624.441471,False,0.0,gpt-5-nano,port-compressor,3624.441471,False,0.0,False,3624.441471 +465c0eb3-2a7c-4df1-b74d-7bd97a67aa0b,grok-code-fast-1,xai,chess-best-move,8377,3519,11896,505.857087,False,0.0,grok-code-fast-1,chess-best-move,505.857087,False,0.0,False,505.857087 
+a17c6f0d-3aea-441b-918c-e1cf26e4bc26,gemini-2.5-pro,gemini,sparql-university,4724,2019,6743,271.966533,True,1.0,gemini-2.5-pro,sparql-university,271.966533,True,0.6,True,271.966533 +26971107-e1da-4865-b2cd-3f2a0d3adb91,gemini-2.5-flash,gemini,make-doom-for-mips,28428,10615,39043,915.855123,False,0.0,gemini-2.5-flash,make-doom-for-mips,915.855123,False,0.0,False,915.855123 +b95d03c8-a3bd-48c4-a1db-6fdfa7475cf3,zai-org/GLM-4.5-Air-FP8,together_ai,reshard-c4-data,3671,2567,6238,325.148476,False,0.0,zai-org/GLM-4.5-Air-FP8,reshard-c4-data,325.148476,False,0.0,False,325.148476 +88c78970-7a52-476f-91d3-f1ad5ee2831d,zai-org/GLM-4.5-Air-FP8,together_ai,feal-linear-cryptanalysis,26419,16629,43048,1075.059699,False,0.0,zai-org/GLM-4.5-Air-FP8,feal-linear-cryptanalysis,1075.059699,False,0.0,False,1075.059699 +55db6067-435f-43fd-a308-50ba39bb8106,claude-sonnet-4-20250514,anthropic,sanitize-git-repo,20666,6369,27035,901.269109,False,0.0,claude-sonnet-4-20250514,sanitize-git-repo,901.269109,False,0.0,False,901.269109 +fb47150a-2a37-4c06-b30e-45bfd46fb26a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,fix-ocaml-gc,32675,14301,46976,1780.07684,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,fix-ocaml-gc,1780.07684,False,0.0,False,1780.07684 +7bda9cf0-03c1-4c6d-93dd-d0407cc75b0d,grok-4-0709,xai,mteb-leaderboard,936,429,1365,247.911355,False,0.0,grok-4-0709,mteb-leaderboard,247.911355,False,0.0,False,247.911355 +04d108d2-5331-41d3-8e72-9ae4921c3632,grok-4-0709,xai,financial-document-processor,13460,5499,18959,801.320454,False,0.0,grok-4-0709,financial-document-processor,801.320454,False,0.0,False,801.320454 +8a2a6aa6-40ae-4c52-b368-857173911a92,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,path-tracing-reverse,7058,2515,9573,467.653959,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,path-tracing-reverse,467.653959,False,0.0,False,467.653959 
+6d77b365-7e63-4b88-97e1-20d615634800,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,bn-fit-modify,17743,7045,24788,1223.847915,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,bn-fit-modify,1223.847915,False,0.0,False,1223.847915 +9243aa47-ecd9-47ac-8dbf-56a39c956566,openai/gpt-oss-120b,together_ai,video-processing,796,1554,2350,112.399611,False,0.0,openai/gpt-oss-120b,video-processing,112.399611,False,0.0,False,112.399611 +f27753f4-b287-42e6-b84c-120f526d18d5,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,make-doom-for-mips,17226,5572,22798,921.348261,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,make-doom-for-mips,921.348261,False,0.0,False,921.348261 +3ae5dc49-8577-4768-bebe-d13281a1e833,gpt-5-mini,openai,feal-linear-cryptanalysis,34601,18391,52992,1805.88624,False,0.0,gpt-5-mini,feal-linear-cryptanalysis,1805.88624,False,0.0,False,1805.88624 +6658a3e1-aceb-463c-bf12-ce4e697d9b2f,gpt-5-nano,openai,make-mips-interpreter,45282,32208,77490,1814.332045,False,0.0,gpt-5-nano,make-mips-interpreter,1814.332045,False,0.0,False,1814.332045 +57d2b30a-0d1a-4531-babe-444bf4b2f64d,zai-org/GLM-4.5-Air-FP8,together_ai,fix-code-vulnerability,7706,5413,13119,250.674926,False,0.0,zai-org/GLM-4.5-Air-FP8,fix-code-vulnerability,250.674926,False,0.0,False,250.674926 +5d608d9c-58fa-4e6d-a287-05b3c1c97090,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,dna-assembly,11313,6296,17609,720.210787,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,dna-assembly,720.210787,False,0.0,False,720.210787 +1edc117a-b336-485a-908c-23b45aa6802f,gemini-2.5-flash,gemini,merge-diff-arc-agi-task,8009,2488,10497,900.054173,False,0.0,gemini-2.5-flash,merge-diff-arc-agi-task,900.054173,False,0.0,False,900.054173 +70a7a9c6-73bc-4892-abd9-7bd13f3dd568,gemini-2.5-pro,gemini,polyglot-c-py,1288,976,2264,188.919988,True,1.0,gemini-2.5-pro,polyglot-c-py,188.919988,True,0.2,True,188.919988 
+aa98cd68-5141-49fe-a4de-cdb3cc8946f3,gemini-2.5-flash,gemini,build-cython-ext,15757,4978,20735,1017.33654,False,0.0,gemini-2.5-flash,build-cython-ext,1017.33654,False,0.0,False,1017.33654 +135185e4-0e1f-4bbc-adcc-8eca9aaea319,moonshotai/Kimi-K2-Instruct-0905,together_ai,install-windows-3.11,15020,7415,22435,1177.880196,False,0.0,moonshotai/Kimi-K2-Instruct-0905,install-windows-3.11,1177.880196,False,0.0,False,1177.880196 +ede3a59d-a84a-42c1-87ea-d41aae22b464,moonshotai/Kimi-K2-Instruct-0905,together_ai,cobol-modernization,10730,11949,22679,902.580559,True,1.0,moonshotai/Kimi-K2-Instruct-0905,cobol-modernization,902.580559,True,0.6,True,902.580559 +cc11a0a4-f69c-457e-b375-be95a3f2cda9,gemini-2.5-pro,gemini,winning-avg-corewars,18781,24583,43364,3601.276672,False,0.0,gemini-2.5-pro,winning-avg-corewars,3601.276672,False,0.0,False,3601.276672 +9f2e71fc-04ce-4def-bcd6-760a6e8383f8,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,dna-assembly,12648,3749,16397,334.24445,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,dna-assembly,334.24445,False,0.0,False,334.24445 +0774f36f-e195-49c5-af0e-6d912cddd63a,openai/gpt-oss-120b,together_ai,torch-tensor-parallelism,2122,1604,3726,49.128307,False,0.0,openai/gpt-oss-120b,torch-tensor-parallelism,49.128307,False,0.0,False,49.128307 +f8d7a257-9adb-4d09-93de-55cf1a6233ee,gemini-2.5-pro,gemini,prove-plus-comm,2372,2350,4722,383.148952,True,1.0,gemini-2.5-pro,prove-plus-comm,383.148952,True,0.8,True,383.148952 +fdcd4aad-a898-463e-a532-5a40cd5a9e28,OpenAI/gpt-oss-20B,together_ai,financial-document-processor,1042,1798,2840,100.421997,False,0.0,OpenAI/gpt-oss-20B,financial-document-processor,100.421997,False,0.0,False,100.421997 +4dc9ff61-d034-433a-b3f2-d4d2d343f008,claude-opus-4-1-20250805,anthropic,largest-eigenval,21932,15087,37019,900.002217,False,0.0,claude-opus-4-1-20250805,largest-eigenval,900.002217,False,0.25,False,900.002217 
+419a276c-f7b8-49cb-8322-453920037ace,gemini-2.5-flash,gemini,port-compressor,31613,46230,77843,3600.002826,False,0.0,gemini-2.5-flash,port-compressor,3600.002826,False,0.0,False,3600.002826 +5dea9c69-032a-4195-9e6e-a495b9ee114b,gpt-5-mini,openai,feal-differential-cryptanalysis,15940,15158,31098,1079.920374,False,0.0,gpt-5-mini,feal-differential-cryptanalysis,1079.920374,False,0.0,False,1079.920374 +c20f0d66-09f1-40af-8f70-cb209fc32bfa,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,pypi-server,6280,1916,8196,167.781209,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,pypi-server,167.781209,True,0.2,True,167.781209 +28255882-cd6a-4aeb-9850-cd41da942f9f,claude-opus-4-1-20250805,anthropic,bn-fit-modify,10839,4234,15073,2010.089567,True,1.0,claude-opus-4-1-20250805,bn-fit-modify,2010.089567,True,0.875,True,2010.089567 +9c9fe6b9-b32d-42be-a9e6-971e95689235,gemini-2.5-pro,gemini,tune-mjcf,6878,6407,13285,912.093685,False,0.0,gemini-2.5-pro,tune-mjcf,912.093685,False,0.2,False,912.093685 +d1316069-d1c1-4d4f-93bf-27372190b9fb,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,form-filling,3981,1819,5800,286.281921,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,form-filling,286.281921,False,0.0,False,286.281921 +3ac84d45-25ae-4f88-9e30-d17dd0403675,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,pypi-server,3614,1196,4810,128.646041,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,pypi-server,128.646041,False,0.2,False,128.646041 +774fb23d-079f-4374-a253-eed5275fe36b,gemini-2.5-flash,gemini,log-summary-date-ranges,2381,1825,4206,70.699959,False,0.0,gemini-2.5-flash,log-summary-date-ranges,70.699959,False,0.0,False,70.699959 +71a69a77-ee48-4a65-b36b-4eeecf36c854,grok-code-fast-1,xai,pytorch-model-recovery,11100,9728,20828,907.022388,False,0.0,grok-code-fast-1,pytorch-model-recovery,907.022388,False,0.8,False,907.022388 
+e7cc511b-f33d-4a36-89ce-76d36801ca40,zai-org/GLM-4.5-Air-FP8,together_ai,circuit-fibsqrt,4033,43565,47598,3605.875561,False,0.0,zai-org/GLM-4.5-Air-FP8,circuit-fibsqrt,3605.875561,False,0.0,False,3605.875561 +e26d29ea-d474-4d51-bc8f-43acaeff5d38,claude-opus-4-1-20250805,anthropic,openssl-selfsigned-cert,4525,3195,7720,439.035807,True,1.0,claude-opus-4-1-20250805,openssl-selfsigned-cert,439.035807,True,1.0,True,439.035807 +16278f11-4364-400b-a421-3e0ccb0320e1,claude-opus-4-1-20250805,anthropic,build-pmars,8553,2417,10970,284.202395,False,0.0,claude-opus-4-1-20250805,build-pmars,284.202395,False,0.5,False,284.202395 +76aa9bb2-cb8f-49bf-af06-aa17a0b6020d,moonshotai/Kimi-K2-Instruct-0905,together_ai,extract-elf,6552,4032,10584,536.281287,True,1.0,moonshotai/Kimi-K2-Instruct-0905,extract-elf,536.281287,True,0.6,True,536.281287 +6ca3e89f-d062-447f-8984-9d8546740405,deepseek-ai/DeepSeek-V3.1,together_ai,tune-mjcf,18535,17835,36370,902.471228,False,0.0,deepseek-ai/DeepSeek-V3.1,tune-mjcf,902.471228,False,0.0,False,902.471228 +ae7b7011-1497-4ef7-9be6-533162879319,deepseek-ai/DeepSeek-V3.1,together_ai,fix-code-vulnerability,14295,6973,21268,905.706249,False,0.0,deepseek-ai/DeepSeek-V3.1,fix-code-vulnerability,905.706249,False,0.2,False,905.706249 +ac89b36e-386b-4d93-813d-c24e88224aae,OpenAI/gpt-oss-20B,together_ai,build-pov-ray,990,2350,3340,106.784039,False,0.0,OpenAI/gpt-oss-20B,build-pov-ray,106.784039,False,0.0,False,106.784039 +9804fe7c-92d8-4761-b3e0-1c95efcedc94,claude-sonnet-4-20250514,anthropic,build-pmars,10725,3813,14538,432.533148,True,1.0,claude-sonnet-4-20250514,build-pmars,432.533148,True,0.6,True,432.533148 +ea45e8cf-2f4c-472b-b6dc-c792a28ece5f,deepseek-ai/DeepSeek-V3.1,together_ai,fix-git,2126,1439,3565,85.629739,True,1.0,deepseek-ai/DeepSeek-V3.1,fix-git,85.629739,True,0.8,True,85.629739 
+192b6cc7-cb55-4ccf-974e-c67f8057cad7,gemini-2.5-pro,gemini,fix-ocaml-gc,40536,14593,55129,3604.805525,False,0.0,gemini-2.5-pro,fix-ocaml-gc,3604.805525,False,0.2,False,3604.805525 +8311d80e-48a7-4b96-8df8-c22defb54d7e,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,train-fasttext,19800,7013,26813,2037.41666,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,train-fasttext,2037.41666,False,0.0,False,2037.41666 +a86dab73-5d7f-40b5-846d-f55ce1e0800a,claude-opus-4-1-20250805,anthropic,polyglot-c-py,6012,5853,11865,478.509961,False,0.0,claude-opus-4-1-20250805,polyglot-c-py,478.509961,False,0.0,False,478.509961 +59b877cd-2dcc-4c41-899a-5538c3fd291a,OpenAI/gpt-oss-20B,together_ai,vulnerable-secret,2174,5166,7340,900.965285,False,0.0,OpenAI/gpt-oss-20B,vulnerable-secret,900.965285,False,0.0,False,900.965285 +4b3e9157-d36a-4fc0-841b-ca70a5656b4b,deepseek-ai/DeepSeek-V3.1,together_ai,openssl-selfsigned-cert,5318,4480,9798,208.543046,True,1.0,deepseek-ai/DeepSeek-V3.1,openssl-selfsigned-cert,208.543046,True,1.0,True,208.543046 +019fbdb9-f7d3-4475-a1a5-aaecae0e1a6f,claude-sonnet-4-20250514,anthropic,sanitize-git-repo,13931,5958,19889,917.23959,False,0.0,claude-sonnet-4-20250514,sanitize-git-repo,917.23959,False,0.0,False,917.23959 +dc7859da-6d76-4729-8bdc-f0185ddc6c30,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,make-doom-for-mips,19042,2786,21828,479.80599,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,make-doom-for-mips,479.80599,False,0.0,False,479.80599 +42d94c9b-ee4d-4fb8-8dee-d5adfbddc7f7,deepseek-ai/DeepSeek-V3.1,together_ai,password-recovery,2153,1688,3841,1324.567928,False,0.0,deepseek-ai/DeepSeek-V3.1,password-recovery,1324.567928,False,0.0,False,1324.567928 +69d0c7c5-795e-4b27-aeef-1d661fe4c8c6,deepseek-ai/DeepSeek-V3.1,together_ai,dna-insert,8765,4558,13323,411.636049,False,0.0,deepseek-ai/DeepSeek-V3.1,dna-insert,411.636049,False,0.0,False,411.636049 
+2ef18b10-d2a9-4857-8d63-f3e631024650,grok-code-fast-1,xai,git-leak-recovery,3727,2923,6650,290.527972,False,0.0,grok-code-fast-1,git-leak-recovery,290.527972,False,0.2,False,290.527972 +5ebb5a6a-3316-4c6a-9f26-2a3bbdab6408,openai/gpt-oss-120b,together_ai,build-pmars,9110,4572,13682,900.501102,False,0.0,openai/gpt-oss-120b,build-pmars,900.501102,False,0.2,False,900.501102 +7bc53f63-700f-4bfa-a688-d925ebbc9e6a,grok-code-fast-1,xai,install-klee-minimal,7075,2660,9735,900.470523,False,0.0,grok-code-fast-1,install-klee-minimal,900.470523,False,0.0,False,900.470523 +26613299-6966-41ae-854d-71cc91bc7a2d,zai-org/GLM-4.5-Air-FP8,together_ai,openssl-selfsigned-cert,3640,2845,6485,204.033374,False,0.0,zai-org/GLM-4.5-Air-FP8,openssl-selfsigned-cert,204.033374,False,0.0,False,204.033374 +f302d744-5403-4158-86c2-bf63c21e8585,zai-org/GLM-4.5-Air-FP8,together_ai,mteb-retrieve,8440,3895,12335,586.633852,False,0.0,zai-org/GLM-4.5-Air-FP8,mteb-retrieve,586.633852,False,0.0,False,586.633852 +af14996c-dcc9-48b5-ada1-a19346018add,gpt-5,openai,pypi-server,4140,1712,5852,209.830223,False,0.0,gpt-5,pypi-server,209.830223,False,0.3333333333333333,False,209.830223 +462f180b-28ea-4829-9bdf-cd1d1408c285,gpt-5-mini,openai,count-dataset-tokens,8915,6511,15426,920.029806,False,0.0,gpt-5-mini,count-dataset-tokens,920.029806,False,0.0,False,920.029806 +94ae7aa9-63c3-4d89-a617-e7f579f290d9,gpt-5,openai,password-recovery,1815,1701,3516,1549.838791,False,0.0,gpt-5,password-recovery,1549.838791,False,0.0,False,1549.838791 +88a3db08-0124-4fa4-b5a2-3230e5b9b19d,claude-opus-4-1-20250805,anthropic,prove-plus-comm,2020,1313,3333,203.618837,True,1.0,claude-opus-4-1-20250805,prove-plus-comm,203.618837,True,1.0,True,203.618837 +ee96708e-0118-4235-8e55-98a88f1b505e,grok-4-0709,xai,constraints-scheduling,3196,1412,4608,591.130595,True,1.0,grok-4-0709,constraints-scheduling,591.130595,True,0.8,True,591.130595 
+8da93d19-ff0e-480f-8438-88ce64b88edc,moonshotai/Kimi-K2-Instruct-0905,together_ai,polyglot-c-py,4550,5169,9719,632.136773,False,0.0,moonshotai/Kimi-K2-Instruct-0905,polyglot-c-py,632.136773,False,0.0,False,632.136773 +0540ddf3-3bee-4a30-be57-4e75b7dd4ce7,gemini-2.5-flash,gemini,tune-mjcf,13794,7997,21791,967.592017,False,0.0,gemini-2.5-flash,tune-mjcf,967.592017,False,0.6,False,967.592017 +d082fe58-69a8-4b5d-b0b9-b31b64431875,openai/gpt-oss-120b,together_ai,winning-avg-corewars,9985,5716,15701,847.490415,True,1.0,openai/gpt-oss-120b,winning-avg-corewars,847.490415,True,0.5,True,847.490415 +526f3558-0eee-4a97-b076-85f32773170b,openai/gpt-oss-120b,together_ai,train-fasttext,25517,13144,38661,3625.486346,False,0.0,openai/gpt-oss-120b,train-fasttext,3625.486346,False,0.0,False,3625.486346 +330709c5-8f13-415d-9c64-3b9dfac60680,zai-org/GLM-4.5-Air-FP8,together_ai,install-windows-3.11,5569,2075,7644,221.956582,False,0.0,zai-org/GLM-4.5-Air-FP8,install-windows-3.11,221.956582,False,0.0,False,221.956582 +58cd1a5b-7c80-490f-a5ac-7810ca708f1b,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,path-tracing,7470,8485,15955,1154.238242,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,path-tracing,1154.238242,False,0.0,False,1154.238242 +4866015e-5bef-43d0-8438-ab03733d0827,gpt-5-nano,openai,install-windows-3.11,40332,25071,65403,3602.906463,False,0.0,gpt-5-nano,install-windows-3.11,3602.906463,False,0.0,False,3602.906463 +826e77bb-4c7c-4e30-b881-40c31a6b208d,claude-opus-4-1-20250805,anthropic,distribution-search,31187,39479,70666,3674.152675,False,0.0,claude-opus-4-1-20250805,distribution-search,3674.152675,False,0.5555555555555556,False,3674.152675 +f7921767-d1dd-436e-babf-328a6c9fb99e,openai/gpt-oss-120b,together_ai,cobol-modernization,5342,3394,8736,173.758361,False,0.0,openai/gpt-oss-120b,cobol-modernization,173.758361,False,0.8,False,173.758361 
+c821726f-7ac8-4249-ae40-9a12c199e9b8,claude-opus-4-1-20250805,anthropic,break-filter-js-from-html,11604,10563,22167,1200.301857,False,0.0,claude-opus-4-1-20250805,break-filter-js-from-html,1200.301857,False,0.2222222222222222,False,1200.301857 +c0c8c7e6-7da2-4b5c-9a88-e71423700e72,gemini-2.5-flash,gemini,largest-eigenval,10385,7702,18087,900.406137,False,0.0,gemini-2.5-flash,largest-eigenval,900.406137,False,0.0,False,900.406137 +d1e0c755-7e0b-4d11-85fc-37ea68f7fb90,grok-code-fast-1,xai,prove-plus-comm,2598,2600,5198,223.013114,True,1.0,grok-code-fast-1,prove-plus-comm,223.013114,True,0.4,True,223.013114 +ad2e2a58-29a6-4ebe-8cde-b779f4157310,claude-opus-4-1-20250805,anthropic,cancel-async-tasks,4286,2674,6960,215.321108,False,0.0,claude-opus-4-1-20250805,cancel-async-tasks,215.321108,False,0.125,False,215.321108 +cc10ca74-b490-46f8-aad8-3b3ee7bc84bd,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,chess-best-move,7635,1886,9521,179.982553,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,chess-best-move,179.982553,False,0.0,False,179.982553 +0db59121-da44-4a2f-b202-6d8eaff52d5d,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-initramfs-qemu,6705,4887,11592,352.566952,False,0.0,moonshotai/Kimi-K2-Instruct-0905,build-initramfs-qemu,352.566952,False,0.0,False,352.566952 +20f8ecdd-8f35-473c-879f-4fb08321cb48,claude-opus-4-1-20250805,anthropic,wasm-pipeline,9283,2700,11983,312.943763,False,0.0,claude-opus-4-1-20250805,wasm-pipeline,312.943763,False,0.1428571428571428,False,312.943763 +9ddb82b5-7d3a-409a-a40a-7fa36fb80648,grok-code-fast-1,xai,reverse-engineering,8074,3683,11757,751.386512,False,0.0,grok-code-fast-1,reverse-engineering,751.386512,False,0.0,False,751.386512 +bba8477f-3e10-4127-b27f-04ab32196270,gpt-5-mini,openai,path-tracing,38363,36339,74702,1809.692491,False,0.0,gpt-5-mini,path-tracing,1809.692491,False,0.0,False,1809.692491 
+176090f4-0f48-4fba-9631-f9a39566165d,deepseek-ai/DeepSeek-V3.1,together_ai,cancel-async-tasks,1764,1070,2834,77.188323,False,0.0,deepseek-ai/DeepSeek-V3.1,cancel-async-tasks,77.188323,False,0.4,False,77.188323 +4cda2590-856b-47f4-a88e-1709f0041087,grok-code-fast-1,xai,polyglot-c-py,1146,434,1580,156.504425,False,0.0,grok-code-fast-1,polyglot-c-py,156.504425,False,0.0,False,156.504425 +6cf723eb-7f40-4780-82ff-74895729a479,grok-code-fast-1,xai,winning-avg-corewars,7549,5364,12913,790.302062,False,0.0,grok-code-fast-1,winning-avg-corewars,790.302062,False,0.0,False,790.302062 +7923a23e-9a79-453c-9a53-13bf733b0482,gpt-5,openai,build-cython-ext,9386,3370,12756,900.471463,False,0.0,gpt-5,build-cython-ext,900.471463,False,0.0,False,900.471463 +b61330e2-0a01-4691-8ddf-658e856ae3b5,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,dna-assembly,10078,4720,14798,733.008006,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,dna-assembly,733.008006,False,0.0,False,733.008006 +5d0d3b90-773b-4b46-9f05-649c93b194b1,zai-org/GLM-4.5-Air-FP8,together_ai,sparql-university,5626,2144,7770,560.913123,False,0.0,zai-org/GLM-4.5-Air-FP8,sparql-university,560.913123,False,0.0,False,560.913123 +8eb0c138-8356-4030-8327-32af4706cdd6,zai-org/GLM-4.5-Air-FP8,together_ai,path-tracing-reverse,24412,19978,44390,1811.171133,False,0.0,zai-org/GLM-4.5-Air-FP8,path-tracing-reverse,1811.171133,False,0.0,False,1811.171133 +28e10d7f-64e9-4b6f-9905-fa9bfed1a9fa,openai/gpt-oss-120b,together_ai,fix-code-vulnerability,22557,14375,36932,982.965566,False,0.0,openai/gpt-oss-120b,fix-code-vulnerability,982.965566,False,0.0,False,982.965566 +b6431da8-b59c-4ca3-8628-25ea57598183,moonshotai/Kimi-K2-Instruct-0905,together_ai,qemu-alpine-ssh,3643,5231,8874,904.611802,False,0.0,moonshotai/Kimi-K2-Instruct-0905,qemu-alpine-ssh,904.611802,False,0.0,False,904.611802 
+f49d58a7-dcd5-4f7c-b363-57e7c4bf5ee3,gemini-2.5-flash,gemini,constraints-scheduling,6491,6055,12546,130.979526,True,1.0,gemini-2.5-flash,constraints-scheduling,130.979526,True,0.4,True,130.979526 +46820140-4540-4cfc-8572-0432c2a52f2b,claude-opus-4-1-20250805,anthropic,nginx-request-logging,4911,2206,7117,176.619626,True,1.0,claude-opus-4-1-20250805,nginx-request-logging,176.619626,True,1.0,True,176.619626 +01023f31-1cd1-4510-9f53-ae5ce6016211,gpt-5-mini,openai,reverse-engineering,12898,19726,32624,1371.185391,False,0.0,gpt-5-mini,reverse-engineering,1371.185391,False,0.0,False,1371.185391 +eed1b113-389a-4d74-9ac4-983b7a2b0ab3,zai-org/GLM-4.5-Air-FP8,together_ai,largest-eigenval,9563,8524,18087,339.727485,False,0.0,zai-org/GLM-4.5-Air-FP8,largest-eigenval,339.727485,False,0.0,False,339.727485 +56f114d0-aae4-45b0-87eb-73e6b3221e4e,gemini-2.5-flash,gemini,gpt2-codegolf,1676,1534,3210,96.722721,False,0.0,gemini-2.5-flash,gpt2-codegolf,96.722721,False,0.0,False,96.722721 +84a92b61-e7e8-4c90-a517-ce3b29045974,openai/gpt-oss-120b,together_ai,regex-log,1448,863,2311,73.696373,True,1.0,openai/gpt-oss-120b,regex-log,73.696373,True,0.4,True,73.696373 +06f4219a-bdb7-47dc-861f-e1f5531db679,grok-code-fast-1,xai,chess-best-move,1069,589,1658,47.413769,False,0.0,grok-code-fast-1,chess-best-move,47.413769,False,0.0,False,47.413769 +007eb065-a6d2-4bf2-b86b-4a43b29a50dc,gemini-2.5-pro,gemini,path-tracing,1952,1710,3662,235.540327,False,0.0,gemini-2.5-pro,path-tracing,235.540327,False,0.0,False,235.540327 +b6f70425-b2ed-4016-a90b-cc22140af471,gemini-2.5-flash,gemini,winning-avg-corewars,33255,44130,77385,3600.201056,False,0.0,gemini-2.5-flash,winning-avg-corewars,3600.201056,False,0.0,False,3600.201056 +22285a78-4e32-4db2-aed1-a9c42d4e339d,openai/gpt-oss-120b,together_ai,tune-mjcf,5583,5037,10620,954.618012,False,0.0,openai/gpt-oss-120b,tune-mjcf,954.618012,False,0.2,False,954.618012 
+728d538f-d5fd-4007-9d6a-9e6db7198a32,claude-sonnet-4-20250514,anthropic,polyglot-rust-c,13494,14487,27981,909.145594,False,0.0,claude-sonnet-4-20250514,polyglot-rust-c,909.145594,False,0.0,False,909.145594 +606da5f6-091d-4f1e-9220-d1cacd740efc,deepseek-ai/DeepSeek-V3.1,together_ai,password-recovery,5162,4455,9617,906.732553,False,0.0,deepseek-ai/DeepSeek-V3.1,password-recovery,906.732553,False,0.0,False,906.732553 +f7e478f3-c500-4543-b744-ac00c383c202,gemini-2.5-pro,gemini,make-doom-for-mips,21918,4718,26636,908.601223,False,0.0,gemini-2.5-pro,make-doom-for-mips,908.601223,False,0.0,False,908.601223 +49b56163-d8f8-4e2e-9936-a62bc3f89546,claude-opus-4-1-20250805,anthropic,cobol-modernization,1024,263,1287,957.879926,False,0.0,claude-opus-4-1-20250805,cobol-modernization,957.879926,False,0.875,False,957.879926 +bdcadd99-bd58-415a-8d89-6bbaa2e9b102,claude-opus-4-1-20250805,anthropic,model-extraction-relu-logits,10149,7731,17880,440.001537,False,0.0,claude-opus-4-1-20250805,model-extraction-relu-logits,440.001537,False,0.0,False,440.001537 +810dfa21-fb91-47e0-8a7a-12bbd39d4469,grok-code-fast-1,xai,reverse-engineering,11256,4811,16067,560.183296,False,0.0,grok-code-fast-1,reverse-engineering,560.183296,False,0.0,False,560.183296 +71b2cadd-4c07-41d1-94f4-c3c6ff789110,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,model-extraction-relu-logits,2467,3322,5789,136.147757,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,model-extraction-relu-logits,136.147757,False,0.0,False,136.147757 +5beba5f6-6e0e-4f19-b0d3-990df690dd62,gemini-2.5-pro,gemini,vulnerable-secret,6447,2999,9446,236.203981,True,1.0,gemini-2.5-pro,vulnerable-secret,236.203981,True,0.8,True,236.203981 +959c199e-d8c0-4844-bb2c-a935554d12b8,grok-4-0709,xai,wasm-pipeline,8489,3649,12138,676.326044,True,1.0,grok-4-0709,wasm-pipeline,676.326044,True,0.4,True,676.326044 
+2103b800-0976-4145-8b02-6801e43d6ff5,gpt-5,openai,extract-elf,5070,4732,9802,105.844648,False,0.0,gpt-5,extract-elf,105.844648,False,0.2857142857142857,False,105.844648 +8619524a-a35f-4bd3-81a0-71b169e5f072,gemini-2.5-pro,gemini,qemu-startup,1111,793,1904,89.109801,False,0.0,gemini-2.5-pro,qemu-startup,89.109801,False,0.2,False,89.109801 +ab1cd615-7d12-4d12-9e38-574737f9a20e,gpt-5-mini,openai,openssl-selfsigned-cert,2398,2647,5045,126.935502,False,0.0,gpt-5-mini,openssl-selfsigned-cert,126.935502,False,0.8,False,126.935502 +1201fa4c-80d4-4052-92f3-00e3055cc4a1,claude-opus-4-1-20250805,anthropic,build-pmars,9641,2375,12016,426.776973,False,0.0,claude-opus-4-1-20250805,build-pmars,426.776973,False,0.5,False,426.776973 +d04d7ced-13f7-42f0-b5ff-5c06ca095503,grok-4-0709,xai,build-pmars,6646,1968,8614,478.532829,False,0.0,grok-4-0709,build-pmars,478.532829,False,0.2,False,478.532829 +bac75088-6e38-43cd-a256-4f5065278f7c,grok-code-fast-1,xai,largest-eigenval,9432,5037,14469,761.680012,False,0.0,grok-code-fast-1,largest-eigenval,761.680012,False,0.0,False,761.680012 +50965709-97d7-4995-a683-704f5a852afd,gpt-5,openai,port-compressor,20991,31169,52160,3634.024205,False,0.0,gpt-5,port-compressor,3634.024205,False,0.0,False,3634.024205 +348f4ebb-349f-40f9-8910-7d2a667b86ec,gemini-2.5-pro,gemini,sqlite-db-truncate,3402,1792,5194,228.332542,False,0.0,gemini-2.5-pro,sqlite-db-truncate,228.332542,False,0.0,False,228.332542 +9ceda5c9-8776-40d5-8044-68e252904863,gpt-5,openai,sqlite-with-gcov,5622,2083,7705,660.777727,True,1.0,gpt-5,sqlite-with-gcov,660.777727,True,0.3333333333333333,True,660.777727 +6d7c73bd-3eaf-4645-9d2d-e1a55411354e,deepseek-ai/DeepSeek-V3.1,together_ai,sqlite-db-truncate,10097,8484,18581,745.641291,False,0.0,deepseek-ai/DeepSeek-V3.1,sqlite-db-truncate,745.641291,False,0.0,False,745.641291 
+b32d0c50-0bbf-4c4c-8fe3-cf7ae0abf9b2,gemini-2.5-pro,gemini,sqlite-with-gcov,3501,1418,4919,432.938835,True,1.0,gemini-2.5-pro,sqlite-with-gcov,432.938835,True,0.8,True,432.938835 +b70adf84-8259-45e2-ba79-8ad4dcd87df3,gpt-5,openai,prove-plus-comm,3304,2062,5366,200.330913,True,1.0,gpt-5,prove-plus-comm,200.330913,True,0.8571428571428571,True,200.330913 +9d6947ee-7536-4e7f-b42f-15862c392708,claude-opus-4-1-20250805,anthropic,financial-document-processor,8576,3284,11860,471.766738,False,0.0,claude-opus-4-1-20250805,financial-document-processor,471.766738,False,0.0,False,471.766738 +5f351a46-6d51-4254-9daa-c74ecf3f2d92,OpenAI/gpt-oss-20B,together_ai,hf-model-inference,3008,893,3901,238.969891,True,1.0,OpenAI/gpt-oss-20B,hf-model-inference,238.969891,True,0.4,True,238.969891 +bb0f568e-46fb-43a2-acf1-687610120f15,gpt-5-nano,openai,tune-mjcf,14928,11627,26555,907.992166,False,0.0,gpt-5-nano,tune-mjcf,907.992166,False,0.0,False,907.992166 +0fab9ddc-e434-4ccd-8ffd-b2056f48fabc,grok-4-0709,xai,sparql-university,4828,1135,5963,524.92489,True,1.0,grok-4-0709,sparql-university,524.92489,True,0.4,True,524.92489 +7ab19ed0-bdc0-422b-88a2-03931ee7ff8d,grok-code-fast-1,xai,gpt2-codegolf,1749,1328,3077,47.196831,False,0.0,grok-code-fast-1,gpt2-codegolf,47.196831,False,0.0,False,47.196831 +5693b834-6e6f-4009-9265-694e90b6ae80,gemini-2.5-flash,gemini,fix-git,2548,2462,5010,137.661949,False,0.0,gemini-2.5-flash,fix-git,137.661949,False,0.8,False,137.661949 +09d88c43-88e6-4a98-a6e9-c32e2f1add4b,gpt-5-mini,openai,dna-insert,15099,8081,23180,363.505823,False,0.0,gpt-5-mini,dna-insert,363.505823,False,0.0,False,363.505823 +380f007c-66c4-4d41-bc98-e4c30ead6385,gemini-2.5-flash,gemini,mteb-leaderboard,970,385,1355,35.149628,False,0.0,gemini-2.5-flash,mteb-leaderboard,35.149628,False,0.0,False,35.149628 
+345e8069-8623-4b60-b391-40b3a0cb7995,claude-opus-4-1-20250805,anthropic,path-tracing,13203,10588,23791,974.599841,False,0.0,claude-opus-4-1-20250805,path-tracing,974.599841,False,0.0,False,974.599841 +3184d1fb-d2ea-420d-bf73-c4756dc26155,gemini-2.5-flash,gemini,configure-git-webserver,8855,3329,12184,405.264032,False,0.0,gemini-2.5-flash,configure-git-webserver,405.264032,False,0.0,False,405.264032 +e9a8641f-ecd3-412c-995e-4d3eb69c96bb,gpt-5-nano,openai,prove-plus-comm,4820,4422,9242,905.307202,False,0.0,gpt-5-nano,prove-plus-comm,905.307202,False,0.4,False,905.307202 +6f2f91a4-6cc5-40c6-b7ff-dddfbe67367c,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,winning-avg-corewars,6818,3932,10750,543.182002,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,winning-avg-corewars,543.182002,False,0.0,False,543.182002 +9fe16851-4f7d-4908-9cf1-e3b9849a37ed,gpt-5,openai,reverse-engineering,14031,4793,18824,585.201575,True,1.0,gpt-5,reverse-engineering,585.201575,True,0.6666666666666666,True,585.201575 +36eda90b-64ae-4353-a05e-b9c249bcd2ee,openai/gpt-oss-120b,together_ai,install-windows-3.11,6497,2591,9088,265.171101,False,0.0,openai/gpt-oss-120b,install-windows-3.11,265.171101,False,0.0,False,265.171101 +d14f3394-d572-4330-937b-5fd9afa9841e,grok-code-fast-1,xai,code-from-image,780,424,1204,1866.610925,False,0.0,grok-code-fast-1,code-from-image,1866.610925,False,0.0,False,1866.610925 +b441002b-6138-4ade-bfc4-d2ff4d5e55d2,openai/gpt-oss-120b,together_ai,polyglot-c-py,1281,1089,2370,89.113331,False,0.0,openai/gpt-oss-120b,polyglot-c-py,89.113331,False,0.0,False,89.113331 +1c68ee78-4dd8-44b0-b2b9-530f1b920b02,zai-org/GLM-4.5-Air-FP8,together_ai,path-tracing,44873,41144,86017,1804.329302,False,0.0,zai-org/GLM-4.5-Air-FP8,path-tracing,1804.329302,False,0.0,False,1804.329302 +dd71d284-491a-4ff9-999a-3c5b4d5b02b1,gpt-5-mini,openai,constraints-scheduling,4495,3886,8381,276.107046,True,1.0,gpt-5-mini,constraints-scheduling,276.107046,True,0.8,True,276.107046 
+e3bc1daf-d874-47c4-977d-9afc42706345,gpt-5,openai,fix-git,3847,1935,5782,138.027554,True,1.0,gpt-5,fix-git,138.027554,True,1.0,True,138.027554 +348e38d8-e712-448a-a243-1c9723bc139d,moonshotai/Kimi-K2-Instruct-0905,together_ai,fix-ocaml-gc,28181,8962,37143,3740.214872,False,0.0,moonshotai/Kimi-K2-Instruct-0905,fix-ocaml-gc,3740.214872,False,0.0,False,3740.214872 +63269270-3db3-4fe4-9521-114dc49ad787,gpt-5,openai,vulnerable-secret,4254,4171,8425,977.156881,False,0.0,gpt-5,vulnerable-secret,977.156881,False,0.2857142857142857,False,977.156881 +4ef30e0f-09d2-441b-b98e-6478ec31defa,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,openssl-selfsigned-cert,1735,1021,2756,44.371112,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,openssl-selfsigned-cert,44.371112,False,0.0,False,44.371112 +e7d7c391-ec9f-4838-9608-ba582af2f270,zai-org/GLM-4.5-Air-FP8,together_ai,pytorch-model-cli,8940,5828,14768,732.785804,False,0.0,zai-org/GLM-4.5-Air-FP8,pytorch-model-cli,732.785804,False,0.0,False,732.785804 +d8f40f19-62e5-495d-ba44-df6c68c1e940,gemini-2.5-pro,gemini,prove-plus-comm,6267,7140,13407,900.049729,False,0.0,gemini-2.5-pro,prove-plus-comm,900.049729,False,0.8,False,900.049729 +ffb2182d-2971-4505-a6c5-728ca507d3b5,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,form-filling,6017,4570,10587,433.688985,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,form-filling,433.688985,True,0.8,True,433.688985 +64ca0768-162b-49b4-95dc-510047e96b06,grok-code-fast-1,xai,chess-best-move,1020,574,1594,64.335596,False,0.0,grok-code-fast-1,chess-best-move,64.335596,False,0.0,False,64.335596 +91f1ca39-a09b-4c21-9c8d-92f41dd28a87,moonshotai/Kimi-K2-Instruct-0905,together_ai,break-filter-js-from-html,7609,9323,16932,1207.503912,False,0.0,moonshotai/Kimi-K2-Instruct-0905,break-filter-js-from-html,1207.503912,False,0.0,False,1207.503912 
+b9eccab8-ff11-4122-a4ab-f070a092cd75,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,port-compressor,57858,31571,89429,3620.130999,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,port-compressor,3620.130999,False,0.0,False,3620.130999 +6dcc6a9f-9fdb-4505-a2a5-43521bfcbd9d,gpt-5,openai,dna-insert,7485,7863,15348,360.425853,False,0.0,gpt-5,dna-insert,360.425853,False,0.0,False,360.425853 +a0f86313-2baf-46c9-be00-e7e031832250,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,cobol-modernization,3524,1813,5337,918.754158,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,cobol-modernization,918.754158,False,0.0,False,918.754158 +f2794c28-0dd2-46b6-80e7-93ca8845989b,zai-org/GLM-4.5-Air-FP8,together_ai,tune-mjcf,8373,9258,17631,903.518,False,0.0,zai-org/GLM-4.5-Air-FP8,tune-mjcf,903.518,False,0.0,False,903.518 +28b74edb-9e8f-4070-9d4b-705ed1b21176,claude-opus-4-1-20250805,anthropic,chess-best-move,7562,5887,13449,271.049721,False,0.0,claude-opus-4-1-20250805,chess-best-move,271.049721,False,0.0,False,271.049721 +7777369a-3e01-4ff5-a2b7-fd87e3795b75,grok-code-fast-1,xai,winning-avg-corewars,10320,14963,25283,2573.111895,False,0.0,grok-code-fast-1,winning-avg-corewars,2573.111895,False,0.0,False,2573.111895 +5a1e5753-f730-46f3-bbff-8b85f290cddc,gemini-2.5-pro,gemini,git-leak-recovery,2066,1219,3285,101.012342,True,1.0,gemini-2.5-pro,git-leak-recovery,101.012342,True,1.0,True,101.012342 +fe3f0b9d-b340-4b27-bf69-892b528bab55,gpt-5,openai,sparql-university,5652,2055,7707,598.274627,True,1.0,gpt-5,sparql-university,598.274627,True,0.8,True,598.274627 +084c53c7-2bba-42f8-b2c2-d848c47b27b5,zai-org/GLM-4.5-Air-FP8,together_ai,db-wal-recovery,5576,8657,14233,740.996391,False,0.0,zai-org/GLM-4.5-Air-FP8,db-wal-recovery,740.996391,False,0.0,False,740.996391 
+b52367d7-d6ae-4ac9-befa-b578ea630571,deepseek-ai/DeepSeek-V3.1,together_ai,adaptive-rejection-sampler,12418,5561,17979,904.762378,False,0.0,deepseek-ai/DeepSeek-V3.1,adaptive-rejection-sampler,904.762378,False,0.2,False,904.762378 +3c13f6df-2120-45c9-aeb7-18f6f2824af7,gpt-5,openai,video-processing,5416,4568,9984,219.297213,False,0.0,gpt-5,video-processing,219.297213,False,0.0,False,219.297213 +19613bb6-a28e-40d7-bfdf-d90252c276bc,grok-code-fast-1,xai,polyglot-rust-c,1140,605,1745,134.311927,False,0.0,grok-code-fast-1,polyglot-rust-c,134.311927,False,0.0,False,134.311927 +e2cc54f9-880a-4947-a064-0813b8257e89,gpt-5,openai,path-tracing-reverse,10994,5692,16686,1019.723959,False,0.0,gpt-5,path-tracing-reverse,1019.723959,False,0.0,False,1019.723959 +940dac43-4203-46fe-88cc-9cab0486c7f3,deepseek-ai/DeepSeek-V3.1,together_ai,install-klee-minimal,12600,1713,14313,1730.107276,False,0.0,deepseek-ai/DeepSeek-V3.1,install-klee-minimal,1730.107276,False,0.0,False,1730.107276 +92a32cb3-09d6-4401-96d0-e3a3d278681c,claude-sonnet-4-20250514,anthropic,filter-js-from-html,7716,6981,14697,413.173615,False,0.0,claude-sonnet-4-20250514,filter-js-from-html,413.173615,False,0.0,False,413.173615 +49e7cfda-6d56-4511-bf5f-7745371f2f09,gpt-5-nano,openai,fix-code-vulnerability,9430,5793,15223,487.895402,False,0.0,gpt-5-nano,fix-code-vulnerability,487.895402,False,0.2,False,487.895402 +8619b2de-26fe-47ed-9f7c-df0395e5ed1a,zai-org/GLM-4.5-Air-FP8,together_ai,vulnerable-secret,1669,3449,5118,935.518186,False,0.0,zai-org/GLM-4.5-Air-FP8,vulnerable-secret,935.518186,False,0.0,False,935.518186 +7e11a645-31b9-4cff-915c-405d5ea398a6,gpt-5,openai,polyglot-rust-c,1868,1732,3600,902.240164,False,0.0,gpt-5,polyglot-rust-c,902.240164,False,0.0,False,902.240164 +d3ee9792-1560-48e6-a69e-14b393301e50,gpt-5,openai,sqlite-db-truncate,4086,5185,9271,902.54355,False,0.0,gpt-5,sqlite-db-truncate,902.54355,False,0.0,False,902.54355 
+2e2165f4-2983-4238-b452-a2f86d005921,claude-opus-4-1-20250805,anthropic,count-dataset-tokens,13414,3929,17343,550.255913,False,0.0,claude-opus-4-1-20250805,count-dataset-tokens,550.255913,False,0.0,False,550.255913 +4fef5661-ba2f-4530-8cb4-97c9cdcac8b5,claude-opus-4-1-20250805,anthropic,constraints-scheduling,4667,3046,7713,125.657312,True,1.0,claude-opus-4-1-20250805,constraints-scheduling,125.657312,True,0.8888888888888888,True,125.657312 +35e727c3-cd38-465a-b6c0-0284251a3495,claude-sonnet-4-20250514,anthropic,qemu-alpine-ssh,2660,3684,6344,308.400338,True,1.0,claude-sonnet-4-20250514,qemu-alpine-ssh,308.400338,True,0.6,True,308.400338 +a67f954c-f839-4f6d-a842-6c7e0d819d11,gemini-2.5-flash,gemini,reshard-c4-data,8300,4243,12543,698.202098,False,0.0,gemini-2.5-flash,reshard-c4-data,698.202098,False,0.0,False,698.202098 +55e27864-033f-4863-b2fd-2c0fadc49d73,OpenAI/gpt-oss-20B,together_ai,fix-git,1444,2980,4424,103.285848,False,0.0,OpenAI/gpt-oss-20B,fix-git,103.285848,False,0.2,False,103.285848 +681e04ca-e202-457c-84f8-c6ebc49e9565,claude-opus-4-1-20250805,anthropic,sqlite-with-gcov,11135,2378,13513,179.5018,True,1.0,claude-opus-4-1-20250805,sqlite-with-gcov,179.5018,True,0.5714285714285714,True,179.5018 +e88c80e3-b8ad-4aba-9fc3-4377e6e1638b,gpt-5,openai,wasm-pipeline,7482,7369,14851,669.227777,True,1.0,gpt-5,wasm-pipeline,669.227777,True,1.0,True,669.227777 +69dd84c8-9fd9-4c5c-bf16-8c9a5f840430,claude-opus-4-1-20250805,anthropic,tune-mjcf,10533,8032,18565,479.479135,True,1.0,claude-opus-4-1-20250805,tune-mjcf,479.479135,True,0.25,True,479.479135 +58c6c3e7-e6f0-4623-9824-f2e8ceb587d8,claude-opus-4-1-20250805,anthropic,log-summary-date-ranges,7091,1695,8786,106.694388,True,1.0,claude-opus-4-1-20250805,log-summary-date-ranges,106.694388,True,0.8888888888888888,True,106.694388 
+8eee870a-d4ed-491b-9bd4-abc0a8b79e60,claude-sonnet-4-20250514,anthropic,path-tracing-reverse,12920,13436,26356,1265.003482,False,0.0,claude-sonnet-4-20250514,path-tracing-reverse,1265.003482,False,0.0,False,1265.003482 +5ff3fb4c-94b4-49d0-b41b-a3afb32a4be5,openai/gpt-oss-120b,together_ai,regex-log,1678,1037,2715,74.322783,False,0.0,openai/gpt-oss-120b,regex-log,74.322783,False,0.4,False,74.322783 +7cad8e0b-1d4e-4f93-91ee-8e159207e8eb,zai-org/GLM-4.5-Air-FP8,together_ai,extract-elf,11838,3206,15044,219.024964,True,1.0,zai-org/GLM-4.5-Air-FP8,extract-elf,219.024964,True,0.4,True,219.024964 +715f036e-2117-4c6f-8027-ad342faf6622,gemini-2.5-pro,gemini,path-tracing,1827,1736,3563,345.822348,False,0.0,gemini-2.5-pro,path-tracing,345.822348,False,0.0,False,345.822348 +6619ff94-0e5a-4ca5-a78a-38509829de94,claude-opus-4-1-20250805,anthropic,sparql-university,5519,2262,7781,265.177911,False,0.0,claude-opus-4-1-20250805,sparql-university,265.177911,False,0.0,False,265.177911 +2627ebe4-7093-49a3-b7d8-52c1459a3272,OpenAI/gpt-oss-20B,together_ai,path-tracing-reverse,5683,20210,25893,1809.183015,False,0.0,OpenAI/gpt-oss-20B,path-tracing-reverse,1809.183015,False,0.0,False,1809.183015 +190bba7d-c99f-4797-b234-c4458aa77244,deepseek-ai/DeepSeek-V3.1,together_ai,circuit-fibsqrt,44846,40786,85632,2142.042451,False,0.0,deepseek-ai/DeepSeek-V3.1,circuit-fibsqrt,2142.042451,False,0.0,False,2142.042451 +cc026822-871a-4d12-b177-572404bf869b,gpt-5-mini,openai,make-mips-interpreter,23731,16925,40656,1105.170292,False,0.0,gpt-5-mini,make-mips-interpreter,1105.170292,False,0.0,False,1105.170292 +d5a46021-57bc-4ce5-a770-79e6a2983a79,claude-opus-4-1-20250805,anthropic,install-windows-3.11,11847,6835,18682,1084.320907,False,0.0,claude-opus-4-1-20250805,install-windows-3.11,1084.320907,False,0.0,False,1084.320907 
+a3993ccb-771b-455f-8d62-b26d79bb7df5,claude-opus-4-1-20250805,anthropic,sparql-university,5046,1901,6947,158.460062,False,0.0,claude-opus-4-1-20250805,sparql-university,158.460062,False,0.0,False,158.460062 +4b9a2d74-74c1-4921-929d-f390577ac6b4,gpt-5-mini,openai,fix-ocaml-gc,23970,23732,47702,3605.146151,False,0.0,gpt-5-mini,fix-ocaml-gc,3605.146151,False,0.0,False,3605.146151 +8253632a-5d6e-4cbb-9b1e-17e764ef1f3b,grok-code-fast-1,xai,circuit-fibsqrt,4093,1775,5868,202.291142,False,0.0,grok-code-fast-1,circuit-fibsqrt,202.291142,False,0.0,False,202.291142 +9580118a-58f2-45ae-bb53-04306b57af3a,claude-opus-4-1-20250805,anthropic,qemu-startup,1635,1441,3076,180.506271,True,1.0,claude-opus-4-1-20250805,qemu-startup,180.506271,True,0.4285714285714285,True,180.506271 +e55ecae2-58f3-4d99-8e65-641725906518,gpt-5-mini,openai,feal-linear-cryptanalysis,22351,19984,42335,1815.211643,False,0.0,gpt-5-mini,feal-linear-cryptanalysis,1815.211643,False,0.0,False,1815.211643 +cd7ef01a-96f3-4a9a-9d5a-3855aaf22a7b,claude-sonnet-4-20250514,anthropic,largest-eigenval,13865,10738,24603,949.621664,False,0.0,claude-sonnet-4-20250514,largest-eigenval,949.621664,False,0.0,False,949.621664 +f5e3b5a9-ec3b-46a3-8afe-758653c44ada,gemini-2.5-flash,gemini,polyglot-c-py,1411,15653,17064,438.353602,False,0.0,gemini-2.5-flash,polyglot-c-py,438.353602,False,0.0,False,438.353602 +d8751f5b-3420-49c9-834e-8aeffa48bb6d,grok-4-0709,xai,install-windows-3.11,4839,947,5786,316.196732,False,0.0,grok-4-0709,install-windows-3.11,316.196732,False,0.0,False,316.196732 +e5412bfd-92a1-4748-a489-1e2f03a34940,gemini-2.5-flash,gemini,path-tracing-reverse,9557,11947,21504,1143.986856,False,0.0,gemini-2.5-flash,path-tracing-reverse,1143.986856,False,0.0,False,1143.986856 +dc81e877-45c9-4c2c-bf96-4178a8218847,openai/gpt-oss-120b,together_ai,feal-differential-cryptanalysis,1287,1009,2296,310.606706,False,0.0,openai/gpt-oss-120b,feal-differential-cryptanalysis,310.606706,False,0.0,False,310.606706 
+1d4e692a-7b19-48b3-8a23-e7dc8987a42f,claude-opus-4-1-20250805,anthropic,path-tracing,8292,5896,14188,969.49986,False,0.0,claude-opus-4-1-20250805,path-tracing,969.49986,False,0.0,False,969.49986 +0843612c-441a-484f-8a8f-4151d2859afd,claude-opus-4-1-20250805,anthropic,mteb-leaderboard,8830,3518,12348,353.952331,False,0.0,claude-opus-4-1-20250805,mteb-leaderboard,353.952331,False,0.0,False,353.952331 +f8518e6e-75f5-451b-bbf4-e9280009b305,claude-opus-4-1-20250805,anthropic,bn-fit-modify,13808,5090,18898,434.211663,True,1.0,claude-opus-4-1-20250805,bn-fit-modify,434.211663,True,0.875,True,434.211663 +814946c3-3467-4ef8-ad1f-01a8603a594f,moonshotai/Kimi-K2-Instruct-0905,together_ai,mteb-retrieve,3340,2998,6338,254.468697,False,0.0,moonshotai/Kimi-K2-Instruct-0905,mteb-retrieve,254.468697,False,0.0,False,254.468697 +7408f7b8-4c3b-43e1-afa4-58538450a4b4,grok-4-0709,xai,make-doom-for-mips,17138,3636,20774,908.349769,False,0.0,grok-4-0709,make-doom-for-mips,908.349769,False,0.0,False,908.349769 +7532947f-61e9-4afd-96b1-63fa5afef698,claude-sonnet-4-20250514,anthropic,code-from-image,14841,12681,27522,1233.638751,False,0.0,claude-sonnet-4-20250514,code-from-image,1233.638751,False,0.2,False,1233.638751 +f686c6dc-4ad8-4fbe-b859-e54c8940f247,claude-sonnet-4-20250514,anthropic,nginx-request-logging,5615,3651,9266,671.271016,True,1.0,claude-sonnet-4-20250514,nginx-request-logging,671.271016,True,1.0,True,671.271016 +72049f09-05fb-4284-944c-78cfc6d74d3e,OpenAI/gpt-oss-20B,together_ai,dna-insert,3993,9865,13858,382.027021,False,0.0,OpenAI/gpt-oss-20B,dna-insert,382.027021,False,0.0,False,382.027021 +0c694af2-29c8-46f1-8ce4-744ece309e29,moonshotai/Kimi-K2-Instruct-0905,together_ai,regex-log,5498,4295,9793,375.161949,True,1.0,moonshotai/Kimi-K2-Instruct-0905,regex-log,375.161949,True,0.4,True,375.161949 +982f1a75-0a33-4cd5-9802-5550c512ff9b,grok-4-0709,xai,cancel-async-tasks,1321,666,1987,266.975641,False,0.0,grok-4-0709,cancel-async-tasks,266.975641,False,0.0,False,266.975641 
+81245d0c-d98b-4f80-b719-f9c193bd5711,deepseek-ai/DeepSeek-V3.1,together_ai,password-recovery,9077,10137,19214,767.896977,False,0.0,deepseek-ai/DeepSeek-V3.1,password-recovery,767.896977,False,0.0,False,767.896977 +fa5dad9c-0b43-465b-9fe6-3386e332def0,grok-4-0709,xai,adaptive-rejection-sampler,5599,2734,8333,902.628289,False,0.0,grok-4-0709,adaptive-rejection-sampler,902.628289,False,0.0,False,902.628289 +043d445e-c060-4c82-8e93-c61ef5faa29d,gemini-2.5-pro,gemini,cobol-modernization,6732,5186,11918,376.961468,True,1.0,gemini-2.5-pro,cobol-modernization,376.961468,True,1.0,True,376.961468 +0235ccea-860e-440c-94b7-8cb224c6a8ac,gpt-5-mini,openai,filter-js-from-html,1517,1627,3144,217.306991,False,0.0,gpt-5-mini,filter-js-from-html,217.306991,False,0.0,False,217.306991 +2ae55719-bbc1-4e65-9991-32578fd559c0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,wasm-pipeline,13686,5255,18941,861.04068,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,wasm-pipeline,861.04068,True,0.6,True,861.04068 +ce940096-d8c0-403b-9396-592a8fac5261,gpt-5-nano,openai,adaptive-rejection-sampler,7755,8669,16424,901.720344,False,0.0,gpt-5-nano,adaptive-rejection-sampler,901.720344,False,0.2,False,901.720344 +1f48f955-08c6-46a1-b7ed-a7f2be8d50c1,claude-sonnet-4-20250514,anthropic,polyglot-c-py,6195,4189,10384,902.81744,False,0.0,claude-sonnet-4-20250514,polyglot-c-py,902.81744,False,0.0,False,902.81744 +7b6aef11-1000-4cef-824d-997cc749602d,gpt-5-nano,openai,torch-tensor-parallelism,10117,7480,17597,900.284344,False,0.0,gpt-5-nano,torch-tensor-parallelism,900.284344,False,0.0,False,900.284344 +83c5abf6-350b-4f37-9a8e-7f16bbde3d10,gpt-5,openai,polyglot-c-py,1740,1845,3585,257.753256,False,0.0,gpt-5,polyglot-c-py,257.753256,False,0.0,False,257.753256 +e3331a99-d920-4031-b3ba-45ff5e1a25a6,gemini-2.5-pro,gemini,large-scale-text-editing,2683,1227,3910,426.761913,False,0.0,gemini-2.5-pro,large-scale-text-editing,426.761913,False,0.4,False,426.761913 
+572b1ccd-ce4a-435d-ba9b-c7debe4d9e60,deepseek-ai/DeepSeek-V3.1,together_ai,sanitize-git-repo,10424,3909,14333,269.101973,False,0.0,deepseek-ai/DeepSeek-V3.1,sanitize-git-repo,269.101973,False,0.0,False,269.101973 +6d1ad3fa-5d9c-49f6-838d-a4cb7ba0ceb4,OpenAI/gpt-oss-20B,together_ai,prove-plus-comm,1229,2365,3594,176.746637,False,0.0,OpenAI/gpt-oss-20B,prove-plus-comm,176.746637,False,0.0,False,176.746637 +ed886b6a-946b-46f9-9e0f-56ad3c34a40b,gpt-5-nano,openai,sqlite-with-gcov,12915,3292,16207,849.763498,True,1.0,gpt-5-nano,sqlite-with-gcov,849.763498,True,0.6,True,849.763498 +5e5ed07e-9e6c-4ba0-b3b8-2f2573b48cb7,gpt-5-mini,openai,path-tracing-reverse,32297,25466,57763,1805.006093,False,0.0,gpt-5-mini,path-tracing-reverse,1805.006093,False,0.0,False,1805.006093 +27ddeb92-460d-49e7-bf3d-4766e7c41341,claude-opus-4-1-20250805,anthropic,financial-document-processor,21760,13728,35488,517.630565,False,0.0,claude-opus-4-1-20250805,financial-document-processor,517.630565,False,0.0,False,517.630565 +58dd69a3-14f0-4311-9466-25351a5871e1,gpt-5,openai,mteb-leaderboard,17676,11754,29430,3193.466254,False,0.0,gpt-5,mteb-leaderboard,3193.466254,False,0.0,False,3193.466254 +be97065c-6e2b-4566-bbca-80b37fd00ec3,claude-opus-4-1-20250805,anthropic,openssl-selfsigned-cert,5038,3724,8762,279.75366,True,1.0,claude-opus-4-1-20250805,openssl-selfsigned-cert,279.75366,True,1.0,True,279.75366 +4ffbb745-91b7-425a-b06b-d697df5bb683,moonshotai/Kimi-K2-Instruct-0905,together_ai,distribution-search,23588,17960,41548,2767.392332,False,0.0,moonshotai/Kimi-K2-Instruct-0905,distribution-search,2767.392332,False,0.2,False,2767.392332 +415a3ca5-14da-4beb-88e7-7b0fe89797df,moonshotai/Kimi-K2-Instruct-0905,together_ai,dna-assembly,14382,11061,25443,720.409605,False,0.0,moonshotai/Kimi-K2-Instruct-0905,dna-assembly,720.409605,False,0.0,False,720.409605 
+a9a418f6-96ff-4b0c-a07f-d690c26972f9,OpenAI/gpt-oss-20B,together_ai,wasm-pipeline,159,2024,2183,94.347954,False,0.0,OpenAI/gpt-oss-20B,wasm-pipeline,94.347954,False,0.0,False,94.347954 +4ded7305-b551-4435-83d2-75e77477c6ec,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,write-compressor,7086,6349,13435,609.812507,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,write-compressor,609.812507,False,0.0,False,609.812507 +7ce8439a-a147-418c-b2d0-01e121161cb9,gpt-5-mini,openai,video-processing,3472,4155,7627,238.627674,False,0.0,gpt-5-mini,video-processing,238.627674,False,0.0,False,238.627674 +d0958c42-7f97-4c32-b18a-5723277b808d,openai/gpt-oss-120b,together_ai,regex-log,1725,1145,2870,106.013093,False,0.0,openai/gpt-oss-120b,regex-log,106.013093,False,0.4,False,106.013093 +2fda543a-55ec-4299-9fd9-6d6e8cb68c09,grok-code-fast-1,xai,largest-eigenval,8327,5483,13810,949.914758,False,0.0,grok-code-fast-1,largest-eigenval,949.914758,False,0.0,False,949.914758 +caa748fc-ef61-44e1-8c2e-72f685681bd9,gpt-5,openai,build-pov-ray,16976,8423,25399,1508.40576,False,0.0,gpt-5,build-pov-ray,1508.40576,False,0.0,False,1508.40576 +26fccddb-85a4-441d-b623-333763be27c9,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,financial-document-processor,14443,9035,23478,740.859158,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,financial-document-processor,740.859158,False,0.0,False,740.859158 +ddc7930d-eace-4d8c-9b88-f5245baceeaf,zai-org/GLM-4.5-Air-FP8,together_ai,large-scale-text-editing,2818,2026,4844,220.464173,False,0.0,zai-org/GLM-4.5-Air-FP8,large-scale-text-editing,220.464173,False,0.0,False,220.464173 +01c10362-c52b-4818-95a7-2b72996c3baf,OpenAI/gpt-oss-20B,together_ai,sanitize-git-repo,441,694,1135,173.568168,False,0.0,OpenAI/gpt-oss-20B,sanitize-git-repo,173.568168,False,0.0,False,173.568168 
+ec2cfd39-9f07-4302-88c8-e67fe228657f,moonshotai/Kimi-K2-Instruct-0905,together_ai,break-filter-js-from-html,2846,2092,4938,1235.606973,False,0.0,moonshotai/Kimi-K2-Instruct-0905,break-filter-js-from-html,1235.606973,False,0.0,False,1235.606973 +34fd79dc-26d3-4791-9b3a-a187d8d5dfe9,gemini-2.5-pro,gemini,financial-document-processor,13997,9901,23898,1206.472336,False,0.0,gemini-2.5-pro,financial-document-processor,1206.472336,False,0.0,False,1206.472336 +2e19f58f-2db6-40f5-a42b-0aad62d039dd,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,torch-tensor-parallelism,1507,684,2191,46.171417,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,torch-tensor-parallelism,46.171417,False,0.0,False,46.171417 +2d67f129-52e9-4c6a-8c0c-4f75f2ad4a50,gpt-5-nano,openai,vulnerable-secret,12721,11305,24026,900.014226,False,0.0,gpt-5-nano,vulnerable-secret,900.014226,False,0.2,False,900.014226 +01ba47ef-b52c-4da6-82b9-4793b4f62243,deepseek-ai/DeepSeek-V3.1,together_ai,wasm-pipeline,9245,6524,15769,829.860657,True,1.0,deepseek-ai/DeepSeek-V3.1,wasm-pipeline,829.860657,True,0.4,True,829.860657 +47ab7c53-5dbb-4629-9b88-49ee1b5ece50,gpt-5-mini,openai,sparql-university,4791,4942,9733,646.661874,False,0.0,gpt-5-mini,sparql-university,646.661874,False,0.0,False,646.661874 +f10129e8-e9fc-4795-b8ba-f76f796b9c36,gpt-5,openai,qemu-startup,1839,1130,2969,193.458991,True,1.0,gpt-5,qemu-startup,193.458991,True,0.8,True,193.458991 +ee1c0775-dcae-4cba-af17-351ab32299c4,gpt-5,openai,largest-eigenval,13169,11066,24235,906.5192,False,0.0,gpt-5,largest-eigenval,906.5192,False,0.0,False,906.5192 +9dcfb3ed-3277-4faa-9b83-785e1ea23455,gpt-5,openai,openssl-selfsigned-cert,2304,1359,3663,124.957272,True,1.0,gpt-5,openssl-selfsigned-cert,124.957272,True,1.0,True,124.957272 
+54e713a9-949a-47c7-945f-db4b6d2d2fef,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,distribution-search,3580,2209,5789,432.03825,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,distribution-search,432.03825,False,0.0,False,432.03825 +f200fe6d-e561-4b0e-9776-795ea77562b7,gpt-5,openai,path-tracing-reverse,27045,16008,43053,1800.005368,False,0.0,gpt-5,path-tracing-reverse,1800.005368,False,0.0,False,1800.005368 +b9d66ccb-9b32-438c-b927-5e722433abb6,claude-opus-4-1-20250805,anthropic,large-scale-text-editing,5728,10959,16687,1200.002049,False,0.0,claude-opus-4-1-20250805,large-scale-text-editing,1200.002049,False,0.6666666666666666,False,1200.002049 +49ac1797-42a7-4927-83a7-4929eb4ebf97,openai/gpt-oss-120b,together_ai,port-compressor,15711,17077,32788,3604.644179,False,0.0,openai/gpt-oss-120b,port-compressor,3604.644179,False,0.0,False,3604.644179 +11022477-f3c9-42ca-9d3e-1a0c7f2e4938,claude-opus-4-1-20250805,anthropic,fix-git,3566,2162,5728,250.800174,True,1.0,claude-opus-4-1-20250805,fix-git,250.800174,True,1.0,True,250.800174 +298ce628-6e43-4625-9581-800bdf02f2be,deepseek-ai/DeepSeek-V3.1,together_ai,openssl-selfsigned-cert,4391,3603,7994,125.310997,True,1.0,deepseek-ai/DeepSeek-V3.1,openssl-selfsigned-cert,125.310997,True,1.0,True,125.310997 +f0025690-0fbf-431e-b9c2-82f174c012dd,grok-4-0709,xai,pytorch-model-cli,4883,1225,6108,900.033448,False,0.0,grok-4-0709,pytorch-model-cli,900.033448,False,0.6,False,900.033448 +e4290f35-5807-4061-9b47-e032191b6763,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,db-wal-recovery,4725,5302,10027,547.685419,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,db-wal-recovery,547.685419,False,0.0,False,547.685419 +188e7f6b-3b3e-48fb-a597-d848d8ec37a1,gemini-2.5-flash,gemini,reverse-engineering,30763,27341,58104,1805.156647,False,0.0,gemini-2.5-flash,reverse-engineering,1805.156647,False,0.0,False,1805.156647 
+dcd9bf4c-f222-4839-9c74-b8bf09bb1c73,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,nginx-request-logging,5254,3944,9198,819.207408,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,nginx-request-logging,819.207408,False,0.4,False,819.207408 +f9fad111-60cc-45e5-97f4-d66e22b3f12a,gpt-5,openai,break-filter-js-from-html,4597,2969,7566,599.685202,True,1.0,gpt-5,break-filter-js-from-html,599.685202,True,0.4285714285714285,True,599.685202 +500ec7c6-b44d-432c-a63e-e8ceea9e9273,gemini-2.5-pro,gemini,chess-best-move,14786,5919,20705,920.806316,False,0.0,gemini-2.5-pro,chess-best-move,920.806316,False,0.0,False,920.806316 +2d57e2ad-f4f8-4f8c-b800-86d71a2c57a3,deepseek-ai/DeepSeek-V3.1,together_ai,fix-code-vulnerability,16661,7694,24355,905.596019,False,0.0,deepseek-ai/DeepSeek-V3.1,fix-code-vulnerability,905.596019,False,0.2,False,905.596019 +954b12e0-f84f-49fd-b97e-1fce9cd819ea,claude-opus-4-1-20250805,anthropic,feal-linear-cryptanalysis,17801,20594,38395,1803.370024,False,0.0,claude-opus-4-1-20250805,feal-linear-cryptanalysis,1803.370024,False,0.0,False,1803.370024 +5ca8ef08-5382-4f65-8487-2872c9840b17,claude-opus-4-1-20250805,anthropic,distribution-search,10344,9463,19807,335.200085,False,0.0,claude-opus-4-1-20250805,distribution-search,335.200085,False,0.5555555555555556,False,335.200085 +747a96ff-d388-4ec6-9db4-0411c63ec1eb,zai-org/GLM-4.5-Air-FP8,together_ai,password-recovery,7122,10186,17308,906.033574,False,0.0,zai-org/GLM-4.5-Air-FP8,password-recovery,906.033574,False,0.0,False,906.033574 +630206c4-0c29-4798-9ad7-8e52e574e5c3,OpenAI/gpt-oss-20B,together_ai,configure-git-webserver,3640,1528,5168,591.241932,False,0.0,OpenAI/gpt-oss-20B,configure-git-webserver,591.241932,False,0.2,False,591.241932 +2f8b3898-a48b-442d-ae15-96af001754e9,claude-opus-4-1-20250805,anthropic,pypi-server,4683,3020,7703,152.529616,True,1.0,claude-opus-4-1-20250805,pypi-server,152.529616,True,1.0,True,152.529616 
+b044de13-2f01-48b2-9006-4e2ed9783d5d,gemini-2.5-pro,gemini,vulnerable-secret,1568,1573,3141,901.357734,False,0.0,gemini-2.5-pro,vulnerable-secret,901.357734,False,0.8,False,901.357734 +98e7d43f-3346-484b-95af-e4f918ce8f56,gpt-5-nano,openai,fix-code-vulnerability,12676,10504,23180,907.712192,False,0.0,gpt-5-nano,fix-code-vulnerability,907.712192,False,0.2,False,907.712192 +57e16a6c-7cf6-4ac5-a6da-24b99ba773b4,claude-opus-4-1-20250805,anthropic,vulnerable-secret,2594,2348,4942,900.486996,False,0.0,claude-opus-4-1-20250805,vulnerable-secret,900.486996,False,0.625,False,900.486996 +92d87607-8518-49f3-8a78-162038017ad1,claude-opus-4-1-20250805,anthropic,qemu-startup,1636,1447,3083,272.279236,True,1.0,claude-opus-4-1-20250805,qemu-startup,272.279236,True,0.4285714285714285,True,272.279236 +f6ef142c-cddf-414e-9068-6f1cac4f6630,deepseek-ai/DeepSeek-V3.1,together_ai,reshard-c4-data,6717,3724,10441,231.644752,False,0.0,deepseek-ai/DeepSeek-V3.1,reshard-c4-data,231.644752,False,0.0,False,231.644752 +10f2c158-abc1-4e84-9853-df0361ebd3ca,gpt-5,openai,fix-code-vulnerability,12420,9950,22370,911.885947,False,0.0,gpt-5,fix-code-vulnerability,911.885947,False,0.0,False,911.885947 +7a68bcc8-7580-42c5-97a1-aa507493420e,claude-opus-4-1-20250805,anthropic,reverse-engineering,37230,23464,60694,1800.012775,False,0.0,claude-opus-4-1-20250805,reverse-engineering,1800.012775,False,0.0,False,1800.012775 +8d442bcd-04d8-42aa-ad4e-834f00602a26,gemini-2.5-pro,gemini,train-fasttext,12858,6461,19319,1510.976587,False,0.0,gemini-2.5-pro,train-fasttext,1510.976587,False,0.0,False,1510.976587 +366d9ddc-1f62-46ec-b15d-321cc1672d20,claude-opus-4-1-20250805,anthropic,prove-plus-comm,1474,1011,2485,38.496605,True,1.0,claude-opus-4-1-20250805,prove-plus-comm,38.496605,True,1.0,True,38.496605 +b5b7d2e1-563b-473f-9676-a07f469c5a01,OpenAI/gpt-oss-20B,together_ai,sqlite-with-gcov,1180,875,2055,28.521407,False,0.0,OpenAI/gpt-oss-20B,sqlite-with-gcov,28.521407,False,0.0,False,28.521407 
+07f4f9ae-1f07-461f-90bb-708c8eae9d4f,claude-opus-4-1-20250805,anthropic,build-pov-ray,15477,4885,20362,964.374654,True,1.0,claude-opus-4-1-20250805,build-pov-ray,964.374654,True,0.75,True,964.374654 +b6921fc8-ba73-4754-a4bd-7e9b8c4c6252,gpt-5-nano,openai,torch-tensor-parallelism,4708,5151,9859,900.235168,False,0.0,gpt-5-nano,torch-tensor-parallelism,900.235168,False,0.0,False,900.235168 +970c8cb4-52ad-428f-8bac-eea6bdf5c12a,gemini-2.5-pro,gemini,polyglot-c-py,1573,1785,3358,214.833179,False,0.0,gemini-2.5-pro,polyglot-c-py,214.833179,False,0.2,False,214.833179 +a27ea156-8698-428e-8524-4231144328f1,openai/gpt-oss-120b,together_ai,winning-avg-corewars,4907,2227,7134,117.953503,False,0.0,openai/gpt-oss-120b,winning-avg-corewars,117.953503,False,0.5,False,117.953503 +ff474af8-dabe-444d-b840-3459de901912,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,make-doom-for-mips,23180,5836,29016,916.591087,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,make-doom-for-mips,916.591087,False,0.0,False,916.591087 +0e5a60a4-d10f-47cc-bbd4-375468593069,moonshotai/Kimi-K2-Instruct-0905,together_ai,make-mips-interpreter,26440,18970,45410,2108.757868,False,0.0,moonshotai/Kimi-K2-Instruct-0905,make-mips-interpreter,2108.757868,False,0.0,False,2108.757868 +311e767d-a2f7-408a-95e2-21b355cbc10a,gemini-2.5-flash,gemini,build-initramfs-qemu,1662,3370,5032,276.387594,False,0.0,gemini-2.5-flash,build-initramfs-qemu,276.387594,False,0.0,False,276.387594 +d1b635f8-0053-4f51-9a24-f4275356c3d4,moonshotai/Kimi-K2-Instruct-0905,together_ai,form-filling,6882,5281,12163,467.072363,True,1.0,moonshotai/Kimi-K2-Instruct-0905,form-filling,467.072363,True,0.8,True,467.072363 +a6255b02-f02a-435f-ae05-d19267f26323,claude-opus-4-1-20250805,anthropic,path-tracing-reverse,40317,31102,71419,1809.098062,False,0.0,claude-opus-4-1-20250805,path-tracing-reverse,1809.098062,False,0.0,False,1809.098062 
+3e8237d5-c0a5-468e-a9c9-c31bd18b6cc6,gpt-5,openai,password-recovery,3955,7733,11688,900.329749,False,0.0,gpt-5,password-recovery,900.329749,False,0.0,False,900.329749 +58fa34e5-e5c1-4e85-ba33-a19c5fb072e7,moonshotai/Kimi-K2-Instruct-0905,together_ai,merge-diff-arc-agi-task,7183,2099,9282,907.826836,False,0.0,moonshotai/Kimi-K2-Instruct-0905,merge-diff-arc-agi-task,907.826836,False,0.0,False,907.826836 +68de687c-2d48-4eef-8a95-c8fab032bafc,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-cython-ext,21829,4327,26156,911.856535,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-cython-ext,911.856535,False,0.0,False,911.856535 +6dbde439-fda8-4773-8da3-e6ac16d5e25d,moonshotai/Kimi-K2-Instruct-0905,together_ai,prove-plus-comm,5247,5612,10859,684.233345,True,1.0,moonshotai/Kimi-K2-Instruct-0905,prove-plus-comm,684.233345,True,0.8,True,684.233345 +ded69ace-95cd-43ca-ab69-53632c0b4ab4,gpt-5,openai,tune-mjcf,9645,5465,15110,900.001077,False,0.0,gpt-5,tune-mjcf,900.001077,False,0.0,False,900.001077 +d068d0c2-582f-48b7-9a82-b38acbbb4330,deepseek-ai/DeepSeek-V3.1,together_ai,prove-plus-comm,1955,1536,3491,351.333096,True,1.0,deepseek-ai/DeepSeek-V3.1,prove-plus-comm,351.333096,True,1.0,True,351.333096 +1e9848b6-6cbf-47d0-b688-b3cd14b4b65b,zai-org/GLM-4.5-Air-FP8,together_ai,train-fasttext,27853,7368,35221,3625.402805,False,0.0,zai-org/GLM-4.5-Air-FP8,train-fasttext,3625.402805,False,0.2,False,3625.402805 +e6babc3c-9239-4b02-adde-6958d6581dea,gemini-2.5-pro,gemini,largest-eigenval,8747,5998,14745,919.057432,False,0.0,gemini-2.5-pro,largest-eigenval,919.057432,False,0.0,False,919.057432 +5e963ba5-83a1-419e-b28a-a37e71fe6c3d,gpt-5-mini,openai,db-wal-recovery,7846,6916,14762,971.119018,False,0.0,gpt-5-mini,db-wal-recovery,971.119018,False,0.0,False,971.119018 
+f74ca665-6f58-40c0-a87c-3818356c870a,OpenAI/gpt-oss-20B,together_ai,sparql-university,684,2094,2778,188.446694,False,0.0,OpenAI/gpt-oss-20B,sparql-university,188.446694,False,0.0,False,188.446694 +bc506962-76de-4eed-9f96-d8646f41928c,claude-sonnet-4-20250514,anthropic,openssl-selfsigned-cert,4916,4300,9216,418.451482,True,1.0,claude-sonnet-4-20250514,openssl-selfsigned-cert,418.451482,True,0.8,True,418.451482 +d5b82da5-ddac-41dc-8340-203c197abeec,moonshotai/Kimi-K2-Instruct-0905,together_ai,count-dataset-tokens,13927,3527,17454,938.349622,False,0.0,moonshotai/Kimi-K2-Instruct-0905,count-dataset-tokens,938.349622,False,0.2,False,938.349622 +6da7c904-8450-4224-b003-a73b3106c338,gpt-5,openai,dna-assembly,12232,14311,26543,750.654915,False,0.0,gpt-5,dna-assembly,750.654915,False,0.0,False,750.654915 +7882256a-af1c-4a07-a2c2-7af24d13189f,gpt-5,openai,merge-diff-arc-agi-task,10935,7183,18118,552.292243,True,1.0,gpt-5,merge-diff-arc-agi-task,552.292243,True,1.0,True,552.292243 +1695b04b-4ecd-4a43-92e9-c7fd5b10402e,grok-4-0709,xai,fix-ocaml-gc,27701,10782,38483,2947.333315,False,0.0,grok-4-0709,fix-ocaml-gc,2947.333315,False,0.0,False,2947.333315 +db6055f0-30ab-4002-96ba-2940d11a7570,OpenAI/gpt-oss-20B,together_ai,torch-tensor-parallelism,918,1027,1945,37.545308,False,0.0,OpenAI/gpt-oss-20B,torch-tensor-parallelism,37.545308,False,0.0,False,37.545308 +75393222-87a2-44ca-bd50-1ff1d800d81f,gpt-5-nano,openai,code-from-image,1064,531,1595,56.311326,False,0.0,gpt-5-nano,code-from-image,56.311326,False,0.0,False,56.311326 +15d03be4-680f-429b-bb5b-b736edcf1895,openai/gpt-oss-120b,together_ai,git-leak-recovery,4481,4986,9467,349.064746,True,1.0,openai/gpt-oss-120b,git-leak-recovery,349.064746,True,0.2,True,349.064746 +67ae6ce5-6de7-4bab-92ed-eea54262aadd,OpenAI/gpt-oss-20B,together_ai,nginx-request-logging,6325,10348,16673,1036.412356,False,0.0,OpenAI/gpt-oss-20B,nginx-request-logging,1036.412356,False,0.0,False,1036.412356 
+04c418bf-6408-49af-8cb0-063ba47cac4f,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sqlite-with-gcov,10358,2231,12589,536.338517,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sqlite-with-gcov,536.338517,True,0.6,True,536.338517 +e60beead-339e-4e52-96d0-abc7d794157c,claude-opus-4-1-20250805,anthropic,sparql-university,5112,2092,7204,199.160967,False,0.0,claude-opus-4-1-20250805,sparql-university,199.160967,False,0.0,False,199.160967 +93065444-5a6d-4e75-a99f-1399973871b0,gemini-2.5-flash,gemini,video-processing,2743,2224,4967,130.618015,False,0.0,gemini-2.5-flash,video-processing,130.618015,False,0.0,False,130.618015 +9d23b336-3fc2-4536-a311-817fd8e460ba,claude-opus-4-1-20250805,anthropic,circuit-fibsqrt,35404,43191,78595,3546.749669,False,0.0,claude-opus-4-1-20250805,circuit-fibsqrt,3546.749669,False,0.0,False,3546.749669 +30aa52df-108a-41fe-9a83-b1e68ea63abb,moonshotai/Kimi-K2-Instruct-0905,together_ai,openssl-selfsigned-cert,3707,2755,6462,225.513232,False,0.0,moonshotai/Kimi-K2-Instruct-0905,openssl-selfsigned-cert,225.513232,False,0.6,False,225.513232 +f0407181-42a8-42f4-bc96-450f35a84397,gpt-5-mini,openai,circuit-fibsqrt,5144,3200,8344,468.453283,False,0.0,gpt-5-mini,circuit-fibsqrt,468.453283,False,0.0,False,468.453283 +5c754e1c-5656-4539-9798-affc4df166b6,moonshotai/Kimi-K2-Instruct-0905,together_ai,nginx-request-logging,4961,3167,8128,624.23191,False,0.0,moonshotai/Kimi-K2-Instruct-0905,nginx-request-logging,624.23191,False,0.4,False,624.23191 +b47fcd39-a3cb-4d0e-992e-41c130136f58,OpenAI/gpt-oss-20B,together_ai,extract-elf,771,882,1653,57.894756,False,0.0,OpenAI/gpt-oss-20B,extract-elf,57.894756,False,0.2,False,57.894756 +15600a7e-617c-497b-b760-32a2c35797f9,deepseek-ai/DeepSeek-V3.1,together_ai,make-doom-for-mips,15795,3931,19726,904.182245,False,0.0,deepseek-ai/DeepSeek-V3.1,make-doom-for-mips,904.182245,False,0.0,False,904.182245 
+13248c77-6e02-40db-85af-dd677750d2a6,gpt-5-nano,openai,reshard-c4-data,21702,24783,46485,900.162178,False,0.0,gpt-5-nano,reshard-c4-data,900.162178,False,0.0,False,900.162178 +c1bc29a2-e8d6-4d3d-95f0-6e1abd61a50b,openai/gpt-oss-120b,together_ai,path-tracing,4118,3360,7478,241.042023,False,0.0,openai/gpt-oss-120b,path-tracing,241.042023,False,0.0,False,241.042023 +a80bb35e-fba3-4f56-90d8-1d5d82ae9f20,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,build-initramfs-qemu,10404,5859,16263,900.70822,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,build-initramfs-qemu,900.70822,False,0.0,False,900.70822 +5d203aaf-d47f-4e4f-bb7b-8d466266e66f,gemini-2.5-pro,gemini,circuit-fibsqrt,4409,3631,8040,266.591979,False,0.0,gemini-2.5-pro,circuit-fibsqrt,266.591979,False,0.0,False,266.591979 +9a7afbcd-4b33-4d6f-9820-044158f8f40d,moonshotai/Kimi-K2-Instruct-0905,together_ai,constraints-scheduling,6000,4320,10320,424.373953,True,1.0,moonshotai/Kimi-K2-Instruct-0905,constraints-scheduling,424.373953,True,0.6,True,424.373953 +1153a511-4f5a-4df4-a342-b1946cacfab3,grok-code-fast-1,xai,cancel-async-tasks,1406,594,2000,58.514461,False,0.0,grok-code-fast-1,cancel-async-tasks,58.514461,False,0.2,False,58.514461 +8012e1aa-9396-481c-8a5f-f0178fe489c8,claude-opus-4-1-20250805,anthropic,install-windows-3.11,8926,2743,11669,1165.921848,False,0.0,claude-opus-4-1-20250805,install-windows-3.11,1165.921848,False,0.0,False,1165.921848 +f56fe099-e01e-4440-89a5-da255386bf42,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,distribution-search,5188,4877,10065,317.376645,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,distribution-search,317.376645,True,0.4,True,317.376645 +0c33b640-b2e5-487e-8fd1-70e77c7fb4b1,zai-org/GLM-4.5-Air-FP8,together_ai,circuit-fibsqrt,10145,23992,34137,3604.425977,False,0.0,zai-org/GLM-4.5-Air-FP8,circuit-fibsqrt,3604.425977,False,0.0,False,3604.425977 
+7c502efa-440c-4d72-8ee6-ccc591cc85f8,gpt-5-mini,openai,bn-fit-modify,15358,16055,31413,922.214965,True,1.0,gpt-5-mini,bn-fit-modify,922.214965,True,0.6,True,922.214965 +72df27a6-6388-444c-8136-2f3c5e524404,grok-code-fast-1,xai,constraints-scheduling,2979,1830,4809,188.243495,True,1.0,grok-code-fast-1,constraints-scheduling,188.243495,True,0.8,True,188.243495 +e269aca4-75d8-41b0-bbd3-3226f107bec9,grok-4-0709,xai,configure-git-webserver,4506,755,5261,487.545781,False,0.0,grok-4-0709,configure-git-webserver,487.545781,False,0.0,False,487.545781 +a0031f01-6a37-4035-9c35-49eee635e5cb,claude-opus-4-1-20250805,anthropic,run-pdp11-code,8755,6946,15701,565.655216,False,0.0,claude-opus-4-1-20250805,run-pdp11-code,565.655216,False,0.0,False,565.655216 +6817506c-b19f-43fe-8762-be6d6931f15b,gpt-5,openai,fix-code-vulnerability,8569,7694,16263,901.991962,False,0.0,gpt-5,fix-code-vulnerability,901.991962,False,0.0,False,901.991962 +a4617cbf-b644-41e7-be2b-004a9c17e855,grok-code-fast-1,xai,sqlite-with-gcov,4695,1274,5969,414.154419,True,1.0,grok-code-fast-1,sqlite-with-gcov,414.154419,True,0.2,True,414.154419 +0bd9dc97-39fb-44b8-81bd-e2e101ee0ac2,claude-opus-4-1-20250805,anthropic,nginx-request-logging,4530,2067,6597,383.576773,True,1.0,claude-opus-4-1-20250805,nginx-request-logging,383.576773,True,1.0,True,383.576773 +7f0a2b99-0418-45e8-ba35-b3a6329fc9a0,claude-opus-4-1-20250805,anthropic,sanitize-git-repo,19159,4381,23540,739.137696,False,0.0,claude-opus-4-1-20250805,sanitize-git-repo,739.137696,False,0.0,False,739.137696 +1ee1a670-cbb8-4ae4-a2d1-8d889395b622,moonshotai/Kimi-K2-Instruct-0905,together_ai,crack-7z-hash,9500,4308,13808,406.804382,True,1.0,moonshotai/Kimi-K2-Instruct-0905,crack-7z-hash,406.804382,True,1.0,True,406.804382 +bc56cbdc-25b6-4c67-ae2d-711c9dab8f69,grok-code-fast-1,xai,git-leak-recovery,1156,648,1804,35.950961,False,0.0,grok-code-fast-1,git-leak-recovery,35.950961,False,0.2,False,35.950961 
+f345537c-9e8e-4dbe-a16f-4dd271c4fb7c,claude-opus-4-1-20250805,anthropic,model-extraction-relu-logits,5898,5237,11135,592.310242,False,0.0,claude-opus-4-1-20250805,model-extraction-relu-logits,592.310242,False,0.0,False,592.310242 +0717b99f-9080-436a-b518-d32c2d0d77d0,gemini-2.5-flash,gemini,merge-diff-arc-agi-task,9717,4341,14058,905.608288,False,0.0,gemini-2.5-flash,merge-diff-arc-agi-task,905.608288,False,0.0,False,905.608288 +881fae9e-c548-4717-acdd-31c16fa7e373,gpt-5-mini,openai,train-fasttext,14317,13488,27805,3624.579383,False,0.0,gpt-5-mini,train-fasttext,3624.579383,False,0.0,False,3624.579383 +db3d4068-02d0-4976-824b-0fc251c20940,gemini-2.5-flash,gemini,mteb-retrieve,2214,884,3098,125.761679,False,0.0,gemini-2.5-flash,mteb-retrieve,125.761679,False,0.0,False,125.761679 +c4ff3e74-a8c1-42a2-9c4a-fdcd281ae138,gpt-5-nano,openai,polyglot-c-py,2388,2566,4954,963.991313,False,0.0,gpt-5-nano,polyglot-c-py,963.991313,False,0.0,False,963.991313 +6188bac0-4578-4117-a337-68845fdbf8f6,moonshotai/Kimi-K2-Instruct-0905,together_ai,fix-git,6028,3949,9977,319.100462,True,1.0,moonshotai/Kimi-K2-Instruct-0905,fix-git,319.100462,True,1.0,True,319.100462 +d2d868ce-b51e-465d-baca-98bfe4a941af,gemini-2.5-pro,gemini,sqlite-with-gcov,7837,1444,9281,329.945283,True,1.0,gemini-2.5-pro,sqlite-with-gcov,329.945283,True,0.8,True,329.945283 +043b8d8f-829a-4edd-b60a-5749ba6f787e,gpt-5,openai,large-scale-text-editing,2367,2336,4703,488.383421,False,0.0,gpt-5,large-scale-text-editing,488.383421,False,0.4285714285714285,False,488.383421 +22699437-2c5d-41f4-8c26-e5a4d135c7a1,zai-org/GLM-4.5-Air-FP8,together_ai,reshard-c4-data,11704,9506,21210,900.021343,False,0.0,zai-org/GLM-4.5-Air-FP8,reshard-c4-data,900.021343,False,0.0,False,900.021343 +4dbe1823-00d9-4988-a879-f62258452369,OpenAI/gpt-oss-20B,together_ai,crack-7z-hash,999,519,1518,36.760144,False,0.0,OpenAI/gpt-oss-20B,crack-7z-hash,36.760144,False,0.0,False,36.760144 
+96a421ff-33c8-4354-b3e4-d1f524d69d4e,claude-opus-4-1-20250805,anthropic,sqlite-with-gcov,9357,1639,10996,523.373141,False,0.0,claude-opus-4-1-20250805,sqlite-with-gcov,523.373141,False,0.5714285714285714,False,523.373141 +5356da93-6806-4a5e-9ab2-9acf4ad08a2d,grok-4-0709,xai,sqlite-with-gcov,7737,1730,9467,441.053005,False,0.0,grok-4-0709,sqlite-with-gcov,441.053005,False,0.0,False,441.053005 +aaec1464-2e89-40a3-9cd5-51bf80b9067c,claude-opus-4-1-20250805,anthropic,sparql-university,4435,1073,5508,1065.074529,False,0.0,claude-opus-4-1-20250805,sparql-university,1065.074529,False,0.0,False,1065.074529 +f498dc16-86fc-4746-a99f-066aa5c8f3d7,moonshotai/Kimi-K2-Instruct-0905,together_ai,write-compressor,6105,7016,13121,902.347031,False,0.0,moonshotai/Kimi-K2-Instruct-0905,write-compressor,902.347031,False,0.0,False,902.347031 +efeacfb3-e638-4c44-8d65-015f25a4ea31,grok-4-0709,xai,merge-diff-arc-agi-task,8296,2403,10699,888.551456,True,1.0,grok-4-0709,merge-diff-arc-agi-task,888.551456,True,0.4,True,888.551456 +cf78898e-2bfa-4a22-a682-d9f05c9fa5b9,gemini-2.5-pro,gemini,build-pmars,11733,3367,15100,387.223245,True,1.0,gemini-2.5-pro,build-pmars,387.223245,True,1.0,True,387.223245 +36fc82e0-4a1a-4e1d-b1cb-0a06218551e4,zai-org/GLM-4.5-Air-FP8,together_ai,build-cython-ext,16387,8441,24828,595.879952,False,0.0,zai-org/GLM-4.5-Air-FP8,build-cython-ext,595.879952,False,0.0,False,595.879952 +493edcad-28c1-4f3c-b613-13748ee6b73f,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,make-doom-for-mips,14397,3567,17964,900.025507,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,make-doom-for-mips,900.025507,False,0.0,False,900.025507 +f559401c-c22f-43a9-ba03-1ab5a3a21e6c,claude-sonnet-4-20250514,anthropic,fix-code-vulnerability,6037,1438,7475,948.347104,False,0.0,claude-sonnet-4-20250514,fix-code-vulnerability,948.347104,False,0.8,False,948.347104 
+da48ae58-d3f0-4173-bf81-193cde60cf3c,claude-sonnet-4-20250514,anthropic,port-compressor,51254,33117,84371,3600.007842,False,0.0,claude-sonnet-4-20250514,port-compressor,3600.007842,False,0.2,False,3600.007842 +63b58936-d21f-4de1-a68f-09b47b2b76e2,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,fix-git,3019,2411,5430,513.804644,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,fix-git,513.804644,True,1.0,True,513.804644 +a0a4ac18-58f9-4ee7-a142-eab0573b351e,claude-opus-4-1-20250805,anthropic,sparql-university,4677,1768,6445,59.700205,False,0.0,claude-opus-4-1-20250805,sparql-university,59.700205,False,0.0,False,59.700205 +af66c2c3-feaf-47d2-925c-2906af9af0c6,claude-opus-4-1-20250805,anthropic,port-compressor,61095,46130,107225,3600.040973,False,0.0,claude-opus-4-1-20250805,port-compressor,3600.040973,False,0.0,False,3600.040973 +1d481c69-4d91-4a84-8618-67724ddf70a7,openai/gpt-oss-120b,together_ai,code-from-image,5941,3298,9239,175.473043,False,0.0,openai/gpt-oss-120b,code-from-image,175.473043,False,0.0,False,175.473043 +8461b0ef-4b34-470b-a195-ef7d0357f164,claude-opus-4-1-20250805,anthropic,tune-mjcf,15423,12703,28126,900.200375,False,0.0,claude-opus-4-1-20250805,tune-mjcf,900.200375,False,0.25,False,900.200375 +fed0226a-8ea0-4871-8033-7aa26322c6c8,OpenAI/gpt-oss-20B,together_ai,log-summary-date-ranges,282,1306,1588,52.304569,False,0.0,OpenAI/gpt-oss-20B,log-summary-date-ranges,52.304569,False,0.0,False,52.304569 +49b9ab9d-3d94-465a-a132-6e4c59abf7f7,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,cancel-async-tasks,1137,495,1632,101.953262,True,1.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,cancel-async-tasks,101.953262,True,0.8,True,101.953262 +a875fca5-bec3-4a26-8344-a936d8ffc665,claude-sonnet-4-20250514,anthropic,train-fasttext,27664,10327,37991,3600.344847,False,0.0,claude-sonnet-4-20250514,train-fasttext,3600.344847,False,0.0,False,3600.344847 
+81696cee-aec4-41fb-a3da-1a2d256a8171,claude-sonnet-4-20250514,anthropic,pypi-server,7457,4478,11935,615.918587,True,1.0,claude-sonnet-4-20250514,pypi-server,615.918587,True,0.8,True,615.918587 +35e11fab-812d-4161-83f1-ab8c80a0f4e3,gemini-2.5-pro,gemini,qemu-startup,1196,1317,2513,214.303761,False,0.0,gemini-2.5-pro,qemu-startup,214.303761,False,0.2,False,214.303761 +d9d9cfc4-805c-44ad-adb4-f5f469253c62,gpt-5-mini,openai,pytorch-model-cli,2072,2033,4105,264.966923,False,0.0,gpt-5-mini,pytorch-model-cli,264.966923,False,0.0,False,264.966923 +b6210482-43ce-4deb-b079-6a454fb2009e,gpt-5-nano,openai,count-dataset-tokens,9565,5722,15287,904.839144,False,0.0,gpt-5-nano,count-dataset-tokens,904.839144,False,0.0,False,904.839144 +10ca91fd-31f4-4ef3-a567-3932041a0352,grok-code-fast-1,xai,cancel-async-tasks,1350,648,1998,66.96576,False,0.0,grok-code-fast-1,cancel-async-tasks,66.96576,False,0.2,False,66.96576 +da53f72c-0961-4c90-9fcb-bc6427559a75,OpenAI/gpt-oss-20B,together_ai,gpt2-codegolf,2721,6339,9060,902.115949,False,0.0,OpenAI/gpt-oss-20B,gpt2-codegolf,902.115949,False,0.0,False,902.115949 +209be4c8-0bd3-4dba-a270-f2f26f4b9d4a,claude-sonnet-4-20250514,anthropic,write-compressor,2552,1386,3938,1416.858009,False,0.0,claude-sonnet-4-20250514,write-compressor,1416.858009,False,0.0,False,1416.858009 +32e2e69d-dc92-4a8b-9a81-a4c0b704b038,grok-code-fast-1,xai,openssl-selfsigned-cert,2007,1020,3027,42.709974,False,0.0,grok-code-fast-1,openssl-selfsigned-cert,42.709974,False,0.2,False,42.709974 +6bcf674f-bb23-4e8a-8097-7e4e619ee316,gpt-5-mini,openai,train-fasttext,15318,19235,34553,3615.210222,False,0.0,gpt-5-mini,train-fasttext,3615.210222,False,0.0,False,3615.210222 +b6680e56-4e5d-4989-a83e-94870532d35e,gemini-2.5-pro,gemini,feal-linear-cryptanalysis,17570,19433,37003,1810.216043,False,0.0,gemini-2.5-pro,feal-linear-cryptanalysis,1810.216043,False,0.0,False,1810.216043 
+17f63c08-b13d-4c5e-86c3-17aad69f9fa1,moonshotai/Kimi-K2-Instruct-0905,together_ai,schemelike-metacircular-eval,31732,32792,64524,1486.135572,False,0.0,moonshotai/Kimi-K2-Instruct-0905,schemelike-metacircular-eval,1486.135572,False,0.0,False,1486.135572 +c6f2cc08-9c24-4363-81ee-5b4493812064,deepseek-ai/DeepSeek-V3.1,together_ai,db-wal-recovery,8644,5910,14554,244.736084,False,0.0,deepseek-ai/DeepSeek-V3.1,db-wal-recovery,244.736084,False,0.0,False,244.736084 +123ff3ca-2c6c-41db-a9a7-079c21ea44ac,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,qemu-alpine-ssh,1622,1316,2938,127.505093,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,qemu-alpine-ssh,127.505093,False,0.0,False,127.505093 +e749f863-648d-454a-9b65-6e91bd21b961,gemini-2.5-flash,gemini,nginx-request-logging,3447,1139,4586,55.245023,False,0.0,gemini-2.5-flash,nginx-request-logging,55.245023,False,0.0,False,55.245023 +1028cb15-47a2-47ea-9725-da877b19afdc,gpt-5,openai,qemu-alpine-ssh,5838,2738,8576,797.312994,False,0.0,gpt-5,qemu-alpine-ssh,797.312994,False,0.1666666666666666,False,797.312994 +5e4c0b84-e784-4546-9881-c8dc44e5abb1,OpenAI/gpt-oss-20B,together_ai,install-klee-minimal,1611,1604,3215,233.394304,False,0.0,OpenAI/gpt-oss-20B,install-klee-minimal,233.394304,False,0.0,False,233.394304 +de79d0fe-4ad6-433e-960a-338a817b5739,gpt-5-mini,openai,financial-document-processor,4388,4175,8563,484.417215,False,0.0,gpt-5-mini,financial-document-processor,484.417215,False,0.0,False,484.417215 +01162b33-c7cb-4566-9660-b8fa4f34d8d6,moonshotai/Kimi-K2-Instruct-0905,together_ai,constraints-scheduling,5788,3773,9561,199.944679,False,0.0,moonshotai/Kimi-K2-Instruct-0905,constraints-scheduling,199.944679,False,0.6,False,199.944679 +56b6ccfa-b007-4cf4-965e-6d02ab8f80f1,grok-code-fast-1,xai,configure-git-webserver,4994,1262,6256,384.738326,False,0.0,grok-code-fast-1,configure-git-webserver,384.738326,False,0.0,False,384.738326 
+b8636d76-e8f3-4ae2-a6d0-f85726172856,openai/gpt-oss-120b,together_ai,cobol-modernization,4546,2521,7067,124.369042,True,1.0,openai/gpt-oss-120b,cobol-modernization,124.369042,True,0.8,True,124.369042 +8611152e-9f91-407f-8eac-4ecee1ac7911,gpt-5-mini,openai,path-tracing,33224,31288,64512,1800.063195,False,0.0,gpt-5-mini,path-tracing,1800.063195,False,0.0,False,1800.063195 +b9cd2030-c82f-4307-bd16-b87826698f91,openai/gpt-oss-120b,together_ai,adaptive-rejection-sampler,4697,2490,7187,455.291343,False,0.0,openai/gpt-oss-120b,adaptive-rejection-sampler,455.291343,False,0.0,False,455.291343 +3630bc08-1f8a-4ba3-a7c0-53734ac59724,zai-org/GLM-4.5-Air-FP8,together_ai,prove-plus-comm,7834,11099,18933,867.81343,True,1.0,zai-org/GLM-4.5-Air-FP8,prove-plus-comm,867.81343,True,0.8,True,867.81343 +165dfcae-d81e-42d6-b04b-5290130548b3,openai/gpt-oss-120b,together_ai,git-leak-recovery,1606,1260,2866,108.627261,False,0.0,openai/gpt-oss-120b,git-leak-recovery,108.627261,False,0.2,False,108.627261 +0860a3c3-5625-49d1-90f8-dc9995c12d79,gpt-5-nano,openai,install-klee-minimal,6739,3333,10072,904.415734,False,0.0,gpt-5-nano,install-klee-minimal,904.415734,False,0.0,False,904.415734 +df4c9379-4877-41dd-9e37-8c26621bd71c,claude-opus-4-1-20250805,anthropic,write-compressor,12623,10824,23447,910.186991,False,0.0,claude-opus-4-1-20250805,write-compressor,910.186991,False,0.0,False,910.186991 +16f43645-c8a5-467c-b37b-1f43313e9ec4,claude-sonnet-4-20250514,anthropic,wasm-pipeline,4615,4668,9283,527.599633,True,1.0,claude-sonnet-4-20250514,wasm-pipeline,527.599633,True,0.6,True,527.599633 +69c5fa14-dca0-43e6-9729-ccd3d9ac5a6f,gemini-2.5-pro,gemini,password-recovery,7034,3625,10659,917.999784,False,0.0,gemini-2.5-pro,password-recovery,917.999784,False,0.0,False,917.999784 
+18bffdab-4965-4fe7-90c1-bdfd01a67e02,moonshotai/Kimi-K2-Instruct-0905,together_ai,torch-tensor-parallelism,3112,2008,5120,418.578883,False,0.0,moonshotai/Kimi-K2-Instruct-0905,torch-tensor-parallelism,418.578883,False,0.0,False,418.578883 +1ec8d952-441b-4aec-870a-800b991c14d9,openai/gpt-oss-120b,together_ai,pypi-server,2475,896,3371,104.80126,True,1.0,openai/gpt-oss-120b,pypi-server,104.80126,True,0.4,True,104.80126 +adbc4e26-5096-4592-a5f7-7773a9a553a5,gpt-5,openai,adaptive-rejection-sampler,2654,9847,12501,900.075567,True,1.0,gpt-5,adaptive-rejection-sampler,900.075567,True,0.4,True,900.075567 +d2c4b380-05db-4bb7-a63a-0c01734eb850,grok-4-0709,xai,configure-git-webserver,4950,2019,6969,382.319631,False,0.0,grok-4-0709,configure-git-webserver,382.319631,False,0.0,False,382.319631 +2f0b151f-66dc-4251-bb94-24a1f84fa4d1,gemini-2.5-flash,gemini,fix-code-vulnerability,17850,13914,31764,805.724129,False,0.0,gemini-2.5-flash,fix-code-vulnerability,805.724129,False,0.0,False,805.724129 +f2aeee12-653d-43d5-8933-36a440239f2a,gpt-5-mini,openai,merge-diff-arc-agi-task,7037,5382,12419,979.610297,False,0.0,gpt-5-mini,merge-diff-arc-agi-task,979.610297,False,0.4,False,979.610297 +721d90f8-70b2-4531-9917-3920bb72ed12,openai/gpt-oss-120b,together_ai,pypi-server,2831,1317,4148,271.763319,False,0.0,openai/gpt-oss-120b,pypi-server,271.763319,False,0.4,False,271.763319 +b233acb8-c9ac-41b7-aa8f-5528feb90190,grok-code-fast-1,xai,build-pov-ray,11726,4833,16559,1342.738897,False,0.0,grok-code-fast-1,build-pov-ray,1342.738897,False,0.2,False,1342.738897 +05629046-aff2-4cbf-9d23-56a27678c9cd,claude-opus-4-1-20250805,anthropic,large-scale-text-editing,4282,2665,6947,630.958542,True,1.0,claude-opus-4-1-20250805,large-scale-text-editing,630.958542,True,0.6666666666666666,True,630.958542 +c4dbba28-aee0-47c5-b50b-b07b2d88c58d,OpenAI/gpt-oss-20B,together_ai,make-mips-interpreter,3121,13703,16824,2058.869895,False,0.0,OpenAI/gpt-oss-20B,make-mips-interpreter,2058.869895,False,0.0,False,2058.869895 
+25cf14f0-7784-4aed-afdb-74274ce42929,moonshotai/Kimi-K2-Instruct-0905,together_ai,torch-tensor-parallelism,21525,9368,30893,900.025716,False,0.0,moonshotai/Kimi-K2-Instruct-0905,torch-tensor-parallelism,900.025716,False,0.0,False,900.025716 +df3c0244-2d9d-4197-a58d-aae134fb9012,gemini-2.5-pro,gemini,gpt2-codegolf,7350,9850,17200,876.970709,False,0.0,gemini-2.5-pro,gpt2-codegolf,876.970709,False,0.0,False,876.970709 +97ceaa3e-d5e3-4f47-ad94-42c699e3be23,grok-4-0709,xai,break-filter-js-from-html,2093,1940,4033,1200.040302,False,0.0,grok-4-0709,break-filter-js-from-html,1200.040302,False,0.0,False,1200.040302 +acc93131-ea29-4366-a99e-142fbf9e742c,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,feal-linear-cryptanalysis,8216,9904,18120,1246.268106,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,feal-linear-cryptanalysis,1246.268106,False,0.0,False,1246.268106 +f253e763-f23b-435b-b7cc-00e157c14410,OpenAI/gpt-oss-20B,together_ai,reverse-engineering,6424,21177,27601,1834.78771,False,0.0,OpenAI/gpt-oss-20B,reverse-engineering,1834.78771,False,0.0,False,1834.78771 +c9365468-fe97-4ae1-9c36-4a88b69a5628,claude-opus-4-1-20250805,anthropic,dna-insert,18600,4706,23306,375.049858,False,0.0,claude-opus-4-1-20250805,dna-insert,375.049858,False,0.0,False,375.049858 +18d0b7c5-7172-467c-aeb8-dde4158cc41d,gpt-5-nano,openai,run-pdp11-code,15374,11042,26416,1005.871915,False,0.0,gpt-5-nano,run-pdp11-code,1005.871915,False,0.0,False,1005.871915 +840db8a2-7621-4e12-937e-e4955c0d5a59,grok-code-fast-1,xai,openssl-selfsigned-cert,3383,3812,7195,259.329827,True,1.0,grok-code-fast-1,openssl-selfsigned-cert,259.329827,True,0.2,True,259.329827 +242354a3-1c59-42ee-a383-74088c08c2b3,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,dna-assembly,7044,2794,9838,119.754246,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,dna-assembly,119.754246,False,0.0,False,119.754246 
+2bc6222f-959d-4abe-85ab-92eae12560b4,zai-org/GLM-4.5-Air-FP8,together_ai,winning-avg-corewars,14956,15220,30176,1660.27635,False,0.0,zai-org/GLM-4.5-Air-FP8,winning-avg-corewars,1660.27635,False,0.0,False,1660.27635 +ef2b94f2-8c1a-4541-9c6f-0d5dead5dca1,claude-sonnet-4-20250514,anthropic,fix-code-vulnerability,12125,5464,17589,801.179318,True,1.0,claude-sonnet-4-20250514,fix-code-vulnerability,801.179318,True,0.8,True,801.179318 +880c4b46-6ff8-47b3-be62-85063c9f4441,claude-opus-4-1-20250805,anthropic,polyglot-c-py,11318,7033,18351,527.587911,False,0.0,claude-opus-4-1-20250805,polyglot-c-py,527.587911,False,0.0,False,527.587911 +17383441-63c8-4da8-b4b7-4dacc9972b22,gpt-5-nano,openai,build-cython-ext,18722,9912,28634,960.328104,False,0.0,gpt-5-nano,build-cython-ext,960.328104,False,0.0,False,960.328104 +03fb3fff-1f8b-4416-bcbc-44a7974cd67f,moonshotai/Kimi-K2-Instruct-0905,together_ai,sqlite-db-truncate,6317,6952,13269,638.45709,False,0.0,moonshotai/Kimi-K2-Instruct-0905,sqlite-db-truncate,638.45709,False,0.0,False,638.45709 +93ab80c4-8742-4f21-8a56-77e20d3afef6,deepseek-ai/DeepSeek-V3.1,together_ai,constraints-scheduling,6100,4582,10682,212.512964,True,1.0,deepseek-ai/DeepSeek-V3.1,constraints-scheduling,212.512964,True,0.8,True,212.512964 +64883f75-7897-4421-b301-987f0bd30455,zai-org/GLM-4.5-Air-FP8,together_ai,extract-elf,15959,3469,19428,202.807915,True,1.0,zai-org/GLM-4.5-Air-FP8,extract-elf,202.807915,True,0.4,True,202.807915 +a5e241b7-ccf6-42cb-ad6f-e14b9467d228,deepseek-ai/DeepSeek-V3.1,together_ai,model-extraction-relu-logits,5936,3458,9394,321.638095,False,0.0,deepseek-ai/DeepSeek-V3.1,model-extraction-relu-logits,321.638095,False,0.2,False,321.638095 +796334c6-e835-43f4-89f1-61f3f311ad64,claude-opus-4-1-20250805,anthropic,schemelike-metacircular-eval,62984,65613,128597,2400.000996,False,0.0,claude-opus-4-1-20250805,schemelike-metacircular-eval,2400.000996,False,0.0,False,2400.000996 
+d1be0bfc-4226-46a5-8467-44764d0f4b63,grok-4-0709,xai,sparql-university,4886,1261,6147,389.847928,False,0.0,grok-4-0709,sparql-university,389.847928,False,0.4,False,389.847928 +14bc30db-4bbd-4924-81ab-aff2e6a28629,moonshotai/Kimi-K2-Instruct-0905,together_ai,model-extraction-relu-logits,9905,7709,17614,493.51599,False,0.0,moonshotai/Kimi-K2-Instruct-0905,model-extraction-relu-logits,493.51599,False,0.4,False,493.51599 +6e732d84-7754-4fd3-9334-2f14417da6c3,gpt-5-mini,openai,regex-log,1543,949,2492,116.841801,True,1.0,gpt-5-mini,regex-log,116.841801,True,0.8,True,116.841801 +a3404e18-f6b0-4207-bd75-0b9a2b98dce9,gpt-5-nano,openai,wasm-pipeline,13642,10944,24586,902.398994,False,0.0,gpt-5-nano,wasm-pipeline,902.398994,False,0.0,False,902.398994 +4d1fc036-a982-4957-a335-fa14a1b685ec,gemini-2.5-flash,gemini,dna-assembly,15205,4169,19374,746.757306,False,0.0,gemini-2.5-flash,dna-assembly,746.757306,False,0.0,False,746.757306 +788f1075-8cd5-4b60-ae3d-e0ac40e8934c,grok-4-0709,xai,log-summary-date-ranges,13146,11517,24663,909.086372,False,0.0,grok-4-0709,log-summary-date-ranges,909.086372,False,0.0,False,909.086372 +dc54abb9-1199-4e64-a5e8-acac9461f2a2,claude-opus-4-1-20250805,anthropic,video-processing,5440,4776,10216,345.855149,False,0.0,claude-opus-4-1-20250805,video-processing,345.855149,False,0.0,False,345.855149 +60d33963-3c6e-46ee-8374-b89961aa210a,deepseek-ai/DeepSeek-V3.1,together_ai,largest-eigenval,4986,4383,9369,317.239354,False,0.0,deepseek-ai/DeepSeek-V3.1,largest-eigenval,317.239354,False,0.2,False,317.239354 +12e800fb-c1ee-45f8-8d7c-e5543f6ac8e1,OpenAI/gpt-oss-20B,together_ai,mteb-leaderboard,933,215,1148,4.127515,False,0.0,OpenAI/gpt-oss-20B,mteb-leaderboard,4.127515,False,0.0,False,4.127515 +7ec6ec4c-0d5a-4260-977b-0c0dc8e7f983,gpt-5-nano,openai,schemelike-metacircular-eval,3301,3219,6520,254.080905,False,0.0,gpt-5-nano,schemelike-metacircular-eval,254.080905,False,0.2,False,254.080905 
+982f680a-a55a-4e5d-abf5-e152f7562d3d,moonshotai/Kimi-K2-Instruct-0905,together_ai,fix-code-vulnerability,16886,10447,27333,900.129505,False,0.0,moonshotai/Kimi-K2-Instruct-0905,fix-code-vulnerability,900.129505,False,0.0,False,900.129505 +f370eed8-632b-4cc4-831e-4aeaaa26b316,grok-4-0709,xai,db-wal-recovery,2533,3366,5899,904.090081,False,0.0,grok-4-0709,db-wal-recovery,904.090081,False,0.2,False,904.090081 +8d444c6a-f2de-49ed-a52c-787b1a48ef4b,claude-opus-4-1-20250805,anthropic,reshard-c4-data,7615,7321,14936,580.075365,False,0.0,claude-opus-4-1-20250805,reshard-c4-data,580.075365,False,0.0,False,580.075365 +84c0a330-2689-4f7f-9b06-914d3f358b4e,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,path-tracing,3593,3989,7582,620.858057,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,path-tracing,620.858057,False,0.0,False,620.858057 +b18ebde1-486f-498f-b12b-5bf7caf922c9,grok-4-0709,xai,sanitize-git-repo,886,369,1255,1012.415013,False,0.0,grok-4-0709,sanitize-git-repo,1012.415013,False,0.0,False,1012.415013 +4a33b7a6-70b5-42b3-a6d7-226993fdae2a,moonshotai/Kimi-K2-Instruct-0905,together_ai,run-pdp11-code,7241,5796,13037,1000.030553,False,0.0,moonshotai/Kimi-K2-Instruct-0905,run-pdp11-code,1000.030553,False,0.0,False,1000.030553 +7c4b329b-fcb9-4c02-b624-f14c79413f6c,claude-opus-4-1-20250805,anthropic,make-doom-for-mips,11803,2362,14165,900.000987,False,0.0,claude-opus-4-1-20250805,make-doom-for-mips,900.000987,False,0.0,False,900.000987 +1d75e94e-40ad-4571-8ae4-d65e60c2a718,deepseek-ai/DeepSeek-V3.1,together_ai,vulnerable-secret,7294,5329,12623,911.703471,False,0.0,deepseek-ai/DeepSeek-V3.1,vulnerable-secret,911.703471,False,0.4,False,911.703471 +538ab4e3-24e2-442f-9a5c-640189bd2e46,claude-opus-4-1-20250805,anthropic,qemu-alpine-ssh,2792,3408,6200,512.544333,True,1.0,claude-opus-4-1-20250805,qemu-alpine-ssh,512.544333,True,0.8571428571428571,True,512.544333 
+b0f55a03-e631-47a9-b558-62a7d7b55c2a,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,model-extraction-relu-logits,7575,6593,14168,498.651982,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,model-extraction-relu-logits,498.651982,False,0.0,False,498.651982 +f21a3760-fafb-4596-a9bf-846b1afa2ce4,claude-opus-4-1-20250805,anthropic,feal-linear-cryptanalysis,28836,29654,58490,1814.22546,False,0.0,claude-opus-4-1-20250805,feal-linear-cryptanalysis,1814.22546,False,0.0,False,1814.22546 +eb846e6b-ae92-477d-97d0-31a0aa87ef36,zai-org/GLM-4.5-Air-FP8,together_ai,cobol-modernization,12783,12659,25442,922.902224,False,0.0,zai-org/GLM-4.5-Air-FP8,cobol-modernization,922.902224,False,0.4,False,922.902224 +2046ff37-8d79-4b3a-b92d-f6d75afe18e6,claude-sonnet-4-20250514,anthropic,prove-plus-comm,1910,1712,3622,198.77971,True,1.0,claude-sonnet-4-20250514,prove-plus-comm,198.77971,True,1.0,True,198.77971 +dd85c226-f2b7-46f2-9d89-3de1e09421f7,deepseek-ai/DeepSeek-V3.1,together_ai,polyglot-rust-c,10657,11650,22307,907.601446,False,0.0,deepseek-ai/DeepSeek-V3.1,polyglot-rust-c,907.601446,False,0.0,False,907.601446 +d7b1e31f-03e9-40af-b22a-431764db7c95,OpenAI/gpt-oss-20B,together_ai,winning-avg-corewars,294,434,728,85.712986,False,0.0,OpenAI/gpt-oss-20B,winning-avg-corewars,85.712986,False,0.0,False,85.712986 +1214de4f-0f26-4299-98c6-a6466657c114,grok-4-0709,xai,train-fasttext,18654,7861,26515,3600.00844,False,0.0,grok-4-0709,train-fasttext,3600.00844,False,0.2,False,3600.00844 +8bbcd39e-a612-430e-8ceb-b9625fe25c1c,gpt-5-nano,openai,largest-eigenval,8301,7496,15797,901.424654,False,0.0,gpt-5-nano,largest-eigenval,901.424654,False,0.0,False,901.424654 +6834953e-7cff-43f5-88c4-5a6610030470,moonshotai/Kimi-K2-Instruct-0905,together_ai,build-initramfs-qemu,4971,5677,10648,528.755006,False,0.0,moonshotai/Kimi-K2-Instruct-0905,build-initramfs-qemu,528.755006,False,0.0,False,528.755006 
+b6771c15-4778-4be2-80c1-bf3d36e89dc1,gemini-2.5-pro,gemini,path-tracing,2584,2076,4660,406.604805,False,0.0,gemini-2.5-pro,path-tracing,406.604805,False,0.0,False,406.604805 +8d802c65-2d3d-4405-95cd-41887a0e4ac6,openai/gpt-oss-120b,together_ai,path-tracing-reverse,13396,19616,33012,1829.715037,False,0.0,openai/gpt-oss-120b,path-tracing-reverse,1829.715037,False,0.0,False,1829.715037 +d2d30452-33d6-4e06-92cb-c7e671f1c114,grok-4-0709,xai,pytorch-model-cli,8974,4527,13501,767.715527,True,1.0,grok-4-0709,pytorch-model-cli,767.715527,True,0.6,True,767.715527 +1e9984ca-4e75-408f-b262-ecf4800fe727,gpt-5-mini,openai,constraints-scheduling,4306,7612,11918,461.605981,True,1.0,gpt-5-mini,constraints-scheduling,461.605981,True,0.8,True,461.605981 +c3faf798-b109-4f60-acf0-434a79257b56,claude-opus-4-1-20250805,anthropic,feal-linear-cryptanalysis,13951,20190,34141,1803.415785,False,0.0,claude-opus-4-1-20250805,feal-linear-cryptanalysis,1803.415785,False,0.0,False,1803.415785 +2438e67f-0d78-4bea-b8a5-0e5c24eecc4d,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,fix-git,5627,3105,8732,272.848379,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,fix-git,272.848379,True,1.0,True,272.848379 +47a91cbb-d396-4a7f-afed-8bdfb316a431,gpt-5,openai,filter-js-from-html,2007,2616,4623,124.138036,False,0.0,gpt-5,filter-js-from-html,124.138036,False,0.0,False,124.138036 +4aa51b5d-590b-4b70-95b9-932dd4828580,grok-code-fast-1,xai,build-pmars,26337,7205,33542,921.134999,False,0.0,grok-code-fast-1,build-pmars,921.134999,False,0.8,False,921.134999 +bf5a5972-1e5b-4999-8849-95938f9e85ff,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,reshard-c4-data,6869,4551,11420,279.981902,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,reshard-c4-data,279.981902,False,0.0,False,279.981902 +6a0c7800-5ac9-4494-b557-27455630fba1,gpt-5,openai,winning-avg-corewars,23617,12886,36503,1408.781807,False,0.0,gpt-5,winning-avg-corewars,1408.781807,False,0.2857142857142857,False,1408.781807 
+e88e3d91-35af-425a-b81a-9f6d4a6c662a,grok-code-fast-1,xai,install-windows-3.11,6668,2463,9131,194.912933,False,0.0,grok-code-fast-1,install-windows-3.11,194.912933,False,0.0,False,194.912933 +58b84e9a-c6b1-432f-9154-39c16c5c6c4e,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,tune-mjcf,6379,5214,11593,903.975567,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,tune-mjcf,903.975567,False,0.0,False,903.975567 +4c87580d-0abf-4283-b736-01f5cbf60a14,moonshotai/Kimi-K2-Instruct-0905,together_ai,dna-insert,8044,4104,12148,361.154423,False,0.0,moonshotai/Kimi-K2-Instruct-0905,dna-insert,361.154423,False,0.0,False,361.154423 +ea5c814f-e991-49a6-9c5f-8730cf12e4fe,claude-opus-4-1-20250805,anthropic,largest-eigenval,10699,5971,16670,1507.487635,False,0.0,claude-opus-4-1-20250805,largest-eigenval,1507.487635,False,0.25,False,1507.487635 +2050eb82-ad25-44a6-b1c7-f90f113f823d,OpenAI/gpt-oss-20B,together_ai,sqlite-db-truncate,494,1105,1599,134.062386,False,0.0,OpenAI/gpt-oss-20B,sqlite-db-truncate,134.062386,False,0.0,False,134.062386 +294b6bf2-112b-46fd-8f94-3d053acd45ca,gpt-5,openai,configure-git-webserver,5897,2171,8068,686.346796,True,1.0,gpt-5,configure-git-webserver,686.346796,True,1.0,True,686.346796 +effe30ab-2890-475b-ade0-263e7ea87865,claude-opus-4-1-20250805,anthropic,db-wal-recovery,7597,5975,13572,1003.965977,False,0.0,claude-opus-4-1-20250805,db-wal-recovery,1003.965977,False,0.0,False,1003.965977 +a999cabe-63c6-498f-901b-1c6bf92f713d,zai-org/GLM-4.5-Air-FP8,together_ai,adaptive-rejection-sampler,14149,15262,29411,912.631231,False,0.0,zai-org/GLM-4.5-Air-FP8,adaptive-rejection-sampler,912.631231,False,0.0,False,912.631231 +0e50d050-c6a4-4b9d-b09c-c69a3dc137b1,gemini-2.5-pro,gemini,regex-log,1240,726,1966,107.855917,False,0.0,gemini-2.5-pro,regex-log,107.855917,False,0.8,False,107.855917 +2066effb-4566-4842-b5a4-fd59b2d34d01,gpt-5,openai,hf-model-inference,3426,1620,5046,441.130385,True,1.0,gpt-5,hf-model-inference,441.130385,True,1.0,True,441.130385 
+6d020c64-9f1a-4787-981b-809db23d7fe4,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,tune-mjcf,11512,6421,17933,912.085006,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,tune-mjcf,912.085006,False,0.0,False,912.085006 +312e49dc-7896-4864-a075-c1ddb7717349,grok-4-0709,xai,install-windows-3.11,5801,2307,8108,342.682359,False,0.0,grok-4-0709,install-windows-3.11,342.682359,False,0.0,False,342.682359 +b0d9a714-3594-415d-98b4-a57b2e740f26,gpt-5-mini,openai,sqlite-db-truncate,3911,3310,7221,277.396603,False,0.0,gpt-5-mini,sqlite-db-truncate,277.396603,False,0.0,False,277.396603 +fc1d4edc-8bc6-4ce9-bfa4-9f090bc483af,gpt-5,openai,dna-assembly,9113,10438,19551,747.223056,False,0.0,gpt-5,dna-assembly,747.223056,False,0.0,False,747.223056 +c0486381-bd53-4051-b66c-973c25422379,zai-org/GLM-4.5-Air-FP8,together_ai,filter-js-from-html,13098,14198,27296,900.773719,False,0.0,zai-org/GLM-4.5-Air-FP8,filter-js-from-html,900.773719,False,0.0,False,900.773719 +cafdbbf5-ede2-433a-99a2-62361ceb0346,claude-opus-4-1-20250805,anthropic,pypi-server,6517,2828,9345,486.381509,True,1.0,claude-opus-4-1-20250805,pypi-server,486.381509,True,1.0,True,486.381509 +cc99d103-67e7-4e3d-97d9-5d9b31b0f706,openai/gpt-oss-120b,together_ai,build-pmars,5952,4518,10470,904.576425,False,0.0,openai/gpt-oss-120b,build-pmars,904.576425,False,0.2,False,904.576425 +496cbc61-7ef3-420e-8263-34a5b82b2108,moonshotai/Kimi-K2-Instruct-0905,together_ai,fix-code-vulnerability,5186,1828,7014,1011.764671,False,0.0,moonshotai/Kimi-K2-Instruct-0905,fix-code-vulnerability,1011.764671,False,0.0,False,1011.764671 +cb6f4975-6a02-4803-b454-ea657ccb1af1,claude-opus-4-1-20250805,anthropic,feal-differential-cryptanalysis,30069,29467,59536,1813.928094,False,0.0,claude-opus-4-1-20250805,feal-differential-cryptanalysis,1813.928094,False,0.0,False,1813.928094 
+0739d1f9-915a-4389-9bbc-fc4d35fab3ae,claude-opus-4-1-20250805,anthropic,fix-code-vulnerability,17812,6558,24370,563.285081,False,0.0,claude-opus-4-1-20250805,fix-code-vulnerability,563.285081,False,0.125,False,563.285081 +69e538e2-a590-4f11-bdbf-8ca774e0142d,OpenAI/gpt-oss-20B,together_ai,extract-elf,1086,1104,2190,90.621321,True,1.0,OpenAI/gpt-oss-20B,extract-elf,90.621321,True,0.2,True,90.621321 +b2c829d1-b88a-413d-a414-3066eef23534,grok-code-fast-1,xai,large-scale-text-editing,2242,1247,3489,161.207289,False,0.0,grok-code-fast-1,large-scale-text-editing,161.207289,False,0.0,False,161.207289 +98fa7820-ed8e-40ce-ae49-ce33282431a3,grok-4-0709,xai,count-dataset-tokens,13909,3497,17406,908.854239,False,0.0,grok-4-0709,count-dataset-tokens,908.854239,False,0.0,False,908.854239 +4345f2dd-9537-4ff5-a854-f2482b6b02e8,gemini-2.5-pro,gemini,feal-linear-cryptanalysis,20776,21115,41891,1819.861515,False,0.0,gemini-2.5-pro,feal-linear-cryptanalysis,1819.861515,False,0.0,False,1819.861515 +311a2ea0-2081-4549-a236-3c90f0924f6a,deepseek-ai/DeepSeek-V3.1,together_ai,build-initramfs-qemu,10061,7472,17533,903.062251,False,0.0,deepseek-ai/DeepSeek-V3.1,build-initramfs-qemu,903.062251,False,0.0,False,903.062251 +10f9dfac-a456-43b2-9eae-3473912232e1,grok-code-fast-1,xai,write-compressor,11038,10710,21748,739.58549,False,0.0,grok-code-fast-1,write-compressor,739.58549,False,0.0,False,739.58549 +be880ce4-3ffb-45ea-b5a6-52c3879eb707,openai/gpt-oss-120b,together_ai,financial-document-processor,8461,8615,17076,786.169261,False,0.0,openai/gpt-oss-120b,financial-document-processor,786.169261,False,0.0,False,786.169261 +f7c6c392-41af-4392-a12c-23bbd3d24558,gpt-5,openai,fix-code-vulnerability,13016,11776,24792,900.000675,False,0.0,gpt-5,fix-code-vulnerability,900.000675,False,0.0,False,900.000675 
+0f5d9b94-364b-448d-a937-dbd0629b05b1,claude-sonnet-4-20250514,anthropic,configure-git-webserver,12461,3984,16445,786.889597,True,1.0,claude-sonnet-4-20250514,configure-git-webserver,786.889597,True,0.6,True,786.889597 +06699cc0-3120-4981-b472-ea34cfb93287,gemini-2.5-flash,gemini,sqlite-db-truncate,3736,2642,6378,451.915077,False,0.0,gemini-2.5-flash,sqlite-db-truncate,451.915077,False,0.0,False,451.915077 +30afb470-d200-4ae2-a6a0-85ae6904c15c,deepseek-ai/DeepSeek-V3.1,together_ai,prove-plus-comm,2296,1574,3870,260.602416,True,1.0,deepseek-ai/DeepSeek-V3.1,prove-plus-comm,260.602416,True,1.0,True,260.602416 +4d4a065e-bf91-4603-8a7d-744900717927,gemini-2.5-pro,gemini,fix-ocaml-gc,33967,15398,49365,3600.001172,False,0.0,gemini-2.5-pro,fix-ocaml-gc,3600.001172,False,0.2,False,3600.001172 +8959f926-02d9-4785-afbf-4d15c5a990e4,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,financial-document-processor,19143,11586,30729,874.378545,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,financial-document-processor,874.378545,False,0.0,False,874.378545 +94ff821e-2677-4513-9a96-9738dd8271a9,openai/gpt-oss-120b,together_ai,pytorch-model-cli,1289,1335,2624,117.514224,False,0.0,openai/gpt-oss-120b,pytorch-model-cli,117.514224,False,0.0,False,117.514224 +3eacad70-53e6-47f6-97d1-0e61be9d806f,moonshotai/Kimi-K2-Instruct-0905,together_ai,crack-7z-hash,10334,4218,14552,598.225772,True,1.0,moonshotai/Kimi-K2-Instruct-0905,crack-7z-hash,598.225772,True,1.0,True,598.225772 +4630bdcf-0d0e-49f2-9e6a-4f89ec7959e6,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-initramfs-qemu,2034,1108,3142,226.543982,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-initramfs-qemu,226.543982,False,0.0,False,226.543982 +ce017748-368f-4b27-835a-f551abb9cc1d,deepseek-ai/DeepSeek-V3.1,together_ai,distribution-search,22632,20704,43336,1200.075023,False,0.0,deepseek-ai/DeepSeek-V3.1,distribution-search,1200.075023,False,0.0,False,1200.075023 
+9b34ad22-6c18-4ff3-a2bd-29077c0ac4fa,grok-4-0709,xai,schemelike-metacircular-eval,6243,4780,11023,2406.90402,False,0.0,grok-4-0709,schemelike-metacircular-eval,2406.90402,False,0.0,False,2406.90402 +0a708b31-0c40-4b5a-a310-e245caca06b4,grok-4-0709,xai,code-from-image,7681,4194,11875,1205.949286,False,0.0,grok-4-0709,code-from-image,1205.949286,False,0.0,False,1205.949286 +7d2ac3a4-cb2d-4946-83ef-26fbd46733b9,claude-opus-4-1-20250805,anthropic,path-tracing-reverse,70764,55003,125767,1800.000681,False,0.0,claude-opus-4-1-20250805,path-tracing-reverse,1800.000681,False,0.0,False,1800.000681 +7aa22908-352c-455e-90ea-03d2da162882,claude-sonnet-4-20250514,anthropic,break-filter-js-from-html,9938,10426,20364,1204.815957,False,0.0,claude-sonnet-4-20250514,break-filter-js-from-html,1204.815957,False,0.0,False,1204.815957 +3f795318-9191-4fdb-83b4-88ead1e0d1c4,zai-org/GLM-4.5-Air-FP8,together_ai,bn-fit-modify,26254,24493,50747,2540.058613,False,0.0,zai-org/GLM-4.5-Air-FP8,bn-fit-modify,2540.058613,False,0.0,False,2540.058613 +84e09410-005e-4e47-97d7-8030f323b93c,gpt-5-nano,openai,model-extraction-relu-logits,1468,1147,2615,82.519475,False,0.0,gpt-5-nano,model-extraction-relu-logits,82.519475,False,0.0,False,82.519475 +be1cdc26-3239-42f8-849b-9c78e47d48a2,gpt-5-mini,openai,dna-assembly,14333,13263,27596,753.47746,False,0.0,gpt-5-mini,dna-assembly,753.47746,False,0.0,False,753.47746 +27a8702b-d1da-4726-a171-bc8d243b5976,claude-opus-4-1-20250805,anthropic,nginx-request-logging,4865,1548,6413,159.488286,True,1.0,claude-opus-4-1-20250805,nginx-request-logging,159.488286,True,1.0,True,159.488286 +1397f4e3-d908-4677-a0a3-afb6f942cb67,deepseek-ai/DeepSeek-V3.1,together_ai,make-doom-for-mips,19067,3273,22340,644.990417,False,0.0,deepseek-ai/DeepSeek-V3.1,make-doom-for-mips,644.990417,False,0.0,False,644.990417 
+aae236ea-eb56-4b19-81e3-659dbdf2e053,gemini-2.5-pro,gemini,build-cython-ext,19021,5307,24328,807.617293,False,0.0,gemini-2.5-pro,build-cython-ext,807.617293,False,0.0,False,807.617293 +474fd036-e0d3-458a-b8db-33e23aecf0cb,claude-opus-4-1-20250805,anthropic,video-processing,3658,3002,6660,210.560505,False,0.0,claude-opus-4-1-20250805,video-processing,210.560505,False,0.0,False,210.560505 +85b372ee-f223-43a8-98a1-0a4dc1cb0344,zai-org/GLM-4.5-Air-FP8,together_ai,make-doom-for-mips,29034,5994,35028,904.991394,False,0.0,zai-org/GLM-4.5-Air-FP8,make-doom-for-mips,904.991394,False,0.0,False,904.991394 +57d50c78-45bc-4194-b71c-0c0c639f8783,deepseek-ai/DeepSeek-V3.1,together_ai,video-processing,4382,2629,7011,339.742443,False,0.0,deepseek-ai/DeepSeek-V3.1,video-processing,339.742443,False,0.0,False,339.742443 +a1cac633-be56-4e41-9681-7cdcbe606461,grok-4-0709,xai,qemu-alpine-ssh,1810,2204,4014,374.229161,False,0.0,grok-4-0709,qemu-alpine-ssh,374.229161,False,0.0,False,374.229161 +93d15a5e-3404-4214-b019-f6dc8234986b,openai/gpt-oss-120b,together_ai,db-wal-recovery,5293,5242,10535,1004.927055,False,0.0,openai/gpt-oss-120b,db-wal-recovery,1004.927055,False,0.0,False,1004.927055 +7487f5bc-9577-45cb-bf52-de7abb21f26b,deepseek-ai/DeepSeek-V3.1,together_ai,hf-model-inference,10002,3144,13146,594.03429,True,1.0,deepseek-ai/DeepSeek-V3.1,hf-model-inference,594.03429,True,0.8,True,594.03429 +58b0f697-532c-4f2f-9210-02e3f189022b,gemini-2.5-pro,gemini,largest-eigenval,6837,5214,12051,901.384442,False,0.0,gemini-2.5-pro,largest-eigenval,901.384442,False,0.0,False,901.384442 +d42cef3c-b8c4-42f2-8918-7f3aa1c6ce9e,gpt-5-mini,openai,fix-ocaml-gc,3197,7000,10197,3755.150004,False,0.0,gpt-5-mini,fix-ocaml-gc,3755.150004,False,0.0,False,3755.150004 +d9bc6c4a-5bd7-4ee1-a032-d56d5e72a6d9,claude-opus-4-1-20250805,anthropic,pypi-server,5609,2277,7886,189.164504,True,1.0,claude-opus-4-1-20250805,pypi-server,189.164504,True,1.0,True,189.164504 
+793ee697-ef3b-4b0f-9016-e88a254d8fa0,claude-opus-4-1-20250805,anthropic,password-recovery,7264,3259,10523,1666.356108,False,0.0,claude-opus-4-1-20250805,password-recovery,1666.356108,False,0.5555555555555556,False,1666.356108 +88066c6f-9bb7-4901-aa6f-40c62f75d8db,zai-org/GLM-4.5-Air-FP8,together_ai,chess-best-move,8305,4728,13033,824.135439,False,0.0,zai-org/GLM-4.5-Air-FP8,chess-best-move,824.135439,False,0.0,False,824.135439 +3f115726-dbd1-4d21-8c8f-2a8352231d72,gpt-5-mini,openai,password-recovery,1802,3389,5191,1666.523669,False,0.0,gpt-5-mini,password-recovery,1666.523669,False,0.0,False,1666.523669 +366ae9a2-490f-4c39-a2a0-96addccc4369,gemini-2.5-flash,gemini,path-tracing,2052,1384,3436,193.685318,False,0.0,gemini-2.5-flash,path-tracing,193.685318,False,0.0,False,193.685318 +fd4a0bc6-f80c-4d9e-8eaf-9d8a22f3c02d,deepseek-ai/DeepSeek-V3.1,together_ai,schemelike-metacircular-eval,24219,21946,46165,1499.610287,False,0.0,deepseek-ai/DeepSeek-V3.1,schemelike-metacircular-eval,1499.610287,False,0.0,False,1499.610287 +0ea95bbc-03c8-4b6f-880a-5ce18bbf2ef3,grok-code-fast-1,xai,sqlite-db-truncate,7091,6634,13725,607.749307,False,0.0,grok-code-fast-1,sqlite-db-truncate,607.749307,False,0.0,False,607.749307 +5c3856ed-d43e-454c-b357-fce6cc12e5d2,OpenAI/gpt-oss-20B,together_ai,schemelike-metacircular-eval,281,578,859,48.781332,False,0.0,OpenAI/gpt-oss-20B,schemelike-metacircular-eval,48.781332,False,0.0,False,48.781332 +8d0298d5-b7ea-4f08-9d45-d5aedae90dff,gemini-2.5-pro,gemini,fix-git,2089,1218,3307,142.166775,True,1.0,gemini-2.5-pro,fix-git,142.166775,True,1.0,True,142.166775 +c0a69b8a-d68b-4619-82c3-119c751921d9,OpenAI/gpt-oss-20B,together_ai,distribution-search,159,1268,1427,128.520165,False,0.0,OpenAI/gpt-oss-20B,distribution-search,128.520165,False,0.0,False,128.520165 +422b814f-151b-4462-8cef-51b3e31e6772,gpt-5-nano,openai,feal-linear-cryptanalysis,23460,18988,42448,1801.318975,False,0.0,gpt-5-nano,feal-linear-cryptanalysis,1801.318975,False,0.0,False,1801.318975 
+72e42d17-1f28-41be-a728-8c1dfb07c1a1,claude-opus-4-1-20250805,anthropic,chess-best-move,9711,8042,17753,578.983481,False,0.0,claude-opus-4-1-20250805,chess-best-move,578.983481,False,0.0,False,578.983481 +33e41779-9e60-4507-9a03-e1c45697ede4,gemini-2.5-pro,gemini,make-mips-interpreter,17529,14411,31940,1059.092077,False,0.0,gemini-2.5-pro,make-mips-interpreter,1059.092077,False,0.0,False,1059.092077 +13dfea1f-a6f0-4b8e-b051-7f844898b6df,claude-sonnet-4-20250514,anthropic,reverse-engineering,16993,14303,31296,1800.001568,False,0.0,claude-sonnet-4-20250514,reverse-engineering,1800.001568,False,0.0,False,1800.001568 +074a4b05-2421-4030-b5f8-f088add70539,moonshotai/Kimi-K2-Instruct-0905,together_ai,chess-best-move,10061,8979,19040,907.607489,False,0.0,moonshotai/Kimi-K2-Instruct-0905,chess-best-move,907.607489,False,0.0,False,907.607489 +174a95cd-d2b2-491a-add5-353b4ef89347,grok-code-fast-1,xai,db-wal-recovery,2823,2543,5366,160.907653,False,0.0,grok-code-fast-1,db-wal-recovery,160.907653,False,0.0,False,160.907653 +db9f55e6-862e-4cfd-a4c7-7314322cba78,gemini-2.5-pro,gemini,openssl-selfsigned-cert,3078,2570,5648,283.026972,True,1.0,gemini-2.5-pro,openssl-selfsigned-cert,283.026972,True,0.6,True,283.026972 +3afc8524-15b2-46d5-96b1-b150eafac367,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,bn-fit-modify,16860,9063,25923,2467.400514,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,bn-fit-modify,2467.400514,False,0.0,False,2467.400514 +b3efe4dd-ce98-4a5b-a1cd-95714af47bec,moonshotai/Kimi-K2-Instruct-0905,together_ai,openssl-selfsigned-cert,3592,3712,7304,633.796514,True,1.0,moonshotai/Kimi-K2-Instruct-0905,openssl-selfsigned-cert,633.796514,True,0.6,True,633.796514 +b13313d9-5438-46be-ae96-e0f67366f950,OpenAI/gpt-oss-20B,together_ai,build-cython-ext,1362,1395,2757,152.200359,False,0.0,OpenAI/gpt-oss-20B,build-cython-ext,152.200359,False,0.0,False,152.200359 
+3a6c3eb0-95dc-4360-8a2b-5c704d3f01d3,gemini-2.5-flash,gemini,fix-ocaml-gc,53355,36248,89603,3612.833067,False,0.0,gemini-2.5-flash,fix-ocaml-gc,3612.833067,False,0.0,False,3612.833067 +9cc75497-c668-4dc6-81be-000a051c3d42,grok-code-fast-1,xai,build-pmars,17694,4329,22023,905.676879,True,1.0,grok-code-fast-1,build-pmars,905.676879,True,0.8,True,905.676879 +a0e604e0-a9f2-4f91-b814-79a5ef02240a,deepseek-ai/DeepSeek-V3.1,together_ai,torch-tensor-parallelism,4761,3770,8531,698.459332,False,0.0,deepseek-ai/DeepSeek-V3.1,torch-tensor-parallelism,698.459332,False,0.0,False,698.459332 +41a76398-04b5-4076-8560-be89f2676739,moonshotai/Kimi-K2-Instruct-0905,together_ai,gpt2-codegolf,15293,6303,21596,908.112842,False,0.0,moonshotai/Kimi-K2-Instruct-0905,gpt2-codegolf,908.112842,False,0.0,False,908.112842 +818a5974-2f0a-49e3-8f58-dec181eed745,moonshotai/Kimi-K2-Instruct-0905,together_ai,openssl-selfsigned-cert,3862,3637,7499,736.863069,True,1.0,moonshotai/Kimi-K2-Instruct-0905,openssl-selfsigned-cert,736.863069,True,0.6,True,736.863069 +bdc8892c-bbea-4564-a78a-4b678bf45e80,claude-sonnet-4-20250514,anthropic,vulnerable-secret,2628,2878,5506,936.769757,False,0.0,claude-sonnet-4-20250514,vulnerable-secret,936.769757,False,0.0,False,936.769757 +1ca88d95-8d7a-42b6-b3fe-1c68146b3437,gemini-2.5-flash,gemini,fix-git,7596,2959,10555,202.258595,True,1.0,gemini-2.5-flash,fix-git,202.258595,True,0.8,True,202.258595 +c1cd8367-2569-4465-955f-ee41cd766df5,gpt-5,openai,reshard-c4-data,2888,6803,9691,478.618469,False,0.0,gpt-5,reshard-c4-data,478.618469,False,0.3333333333333333,False,478.618469 +671d6d8a-184a-4e08-8294-a0394813d0a3,gemini-2.5-pro,gemini,filter-js-from-html,4024,6304,10328,452.584749,False,0.0,gemini-2.5-pro,filter-js-from-html,452.584749,False,0.0,False,452.584749 +f982da4b-04b2-4db7-83fc-467ad22d635d,OpenAI/gpt-oss-20B,together_ai,fix-git,1423,1008,2431,153.742197,False,0.0,OpenAI/gpt-oss-20B,fix-git,153.742197,False,0.2,False,153.742197 
+f23c0e44-c9ff-4ec5-81b7-cb98e4f67cba,gemini-2.5-flash,gemini,crack-7z-hash,13523,4973,18496,792.182081,True,1.0,gemini-2.5-flash,crack-7z-hash,792.182081,True,0.8,True,792.182081 +c7cad823-9eff-4326-be3c-765f4cc43bd8,zai-org/GLM-4.5-Air-FP8,together_ai,wasm-pipeline,11824,8518,20342,508.230362,False,0.0,zai-org/GLM-4.5-Air-FP8,wasm-pipeline,508.230362,False,0.2,False,508.230362 +646e2c95-f660-4eb3-9687-cb2a9c9d1815,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,extract-elf,12234,5893,18127,775.699841,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,extract-elf,775.699841,True,0.6,True,775.699841 +b2dcf992-5e65-480b-83d8-c624b586164e,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,extract-elf,11619,5453,17072,651.489508,True,1.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,extract-elf,651.489508,True,0.6,True,651.489508 +e495ed63-5774-4d09-9924-8284d438715b,moonshotai/Kimi-K2-Instruct-0905,together_ai,dna-assembly,17114,12850,29964,618.855287,False,0.0,moonshotai/Kimi-K2-Instruct-0905,dna-assembly,618.855287,False,0.0,False,618.855287 +142df19c-8a95-4738-8be5-c698ac9d911a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,break-filter-js-from-html,2671,2295,4966,278.788817,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,break-filter-js-from-html,278.788817,False,0.0,False,278.788817 +031e87ef-51ef-49e5-8992-45ecda232b84,deepseek-ai/DeepSeek-V3.1,together_ai,video-processing,3971,3720,7691,377.818725,False,0.0,deepseek-ai/DeepSeek-V3.1,video-processing,377.818725,False,0.0,False,377.818725 +8bab85bc-7dd8-4a3a-98b8-a4050319f92b,zai-org/GLM-4.5-Air-FP8,together_ai,pypi-server,6687,4326,11013,504.888556,True,1.0,zai-org/GLM-4.5-Air-FP8,pypi-server,504.888556,True,0.2,True,504.888556 
+7262a830-bc7f-4d42-8ed9-90bec1790942,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,model-extraction-relu-logits,1300,1970,3270,108.303099,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,model-extraction-relu-logits,108.303099,False,0.0,False,108.303099 +1cbdd164-b331-4539-8f4d-76ea079c3d6c,grok-4-0709,xai,run-pdp11-code,1995,2779,4774,2470.05237,False,0.0,grok-4-0709,run-pdp11-code,2470.05237,False,0.0,False,2470.05237 +ed4dfded-1486-4b8b-85d8-c50e61dbbe0b,gpt-5-mini,openai,run-pdp11-code,6699,3762,10461,1122.815201,False,0.0,gpt-5-mini,run-pdp11-code,1122.815201,False,0.0,False,1122.815201 +42506c05-0b8f-44c5-bdf9-471d096039eb,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,polyglot-c-py,11981,12235,24216,900.021209,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,polyglot-c-py,900.021209,False,0.0,False,900.021209 +d7e18913-fb5c-49a4-a3ed-6633139ee79b,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,pytorch-model-recovery,14928,7619,22547,902.05764,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,pytorch-model-recovery,902.05764,False,0.8,False,902.05764 +454bb4cd-caef-48d8-a10d-65d29963c25e,deepseek-ai/DeepSeek-V3.1,together_ai,code-from-image,16384,13011,29395,779.911904,True,1.0,deepseek-ai/DeepSeek-V3.1,code-from-image,779.911904,True,0.6,True,779.911904 +d372fa99-92ec-40e8-91ae-24a4d9357550,grok-code-fast-1,xai,large-scale-text-editing,2222,1497,3719,120.093058,False,0.0,grok-code-fast-1,large-scale-text-editing,120.093058,False,0.0,False,120.093058 +cb552c04-f6df-416e-b20c-da69d7ee8d92,grok-code-fast-1,xai,make-mips-interpreter,10507,15757,26264,1453.991861,False,0.0,grok-code-fast-1,make-mips-interpreter,1453.991861,False,0.0,False,1453.991861 +4f369f3f-2d33-40d5-9e31-ec17dabc3ae5,openai/gpt-oss-120b,together_ai,code-from-image,14799,15083,29882,741.887313,False,0.0,openai/gpt-oss-120b,code-from-image,741.887313,False,0.0,False,741.887313 
+c18480b4-b3d9-413b-ba83-535f8945e605,claude-sonnet-4-20250514,anthropic,password-recovery,5135,5644,10779,900.889209,False,0.0,claude-sonnet-4-20250514,password-recovery,900.889209,False,0.4,False,900.889209 +3974277b-9ee3-49ba-95a3-e6ce60994f5b,gpt-5,openai,build-pov-ray,33383,39180,72563,6000.001667,False,0.0,gpt-5,build-pov-ray,6000.001667,False,0.0,False,6000.001667 +491fea6e-e16d-489a-b98b-4b61473c3046,claude-opus-4-1-20250805,anthropic,merge-diff-arc-agi-task,24908,16430,41338,905.178974,False,0.0,claude-opus-4-1-20250805,merge-diff-arc-agi-task,905.178974,False,0.3333333333333333,False,905.178974 +688961b2-6e1b-4b48-a3a4-a8fef9ac0a97,gpt-5-nano,openai,openssl-selfsigned-cert,2349,1824,4173,111.455464,True,1.0,gpt-5-nano,openssl-selfsigned-cert,111.455464,True,0.6,True,111.455464 +79b6aed7-befd-4e44-93b8-09d912819591,claude-opus-4-1-20250805,anthropic,sqlite-with-gcov,9861,1561,11422,263.510691,False,0.0,claude-opus-4-1-20250805,sqlite-with-gcov,263.510691,False,0.5714285714285714,False,263.510691 +0193f7f3-563d-4ca1-a35a-4b48ccbbe905,gpt-5,openai,db-wal-recovery,9836,10968,20804,915.504961,False,0.0,gpt-5,db-wal-recovery,915.504961,False,0.1428571428571428,False,915.504961 +1b46938a-eb1c-42da-83f1-cbc58b211bce,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,build-pmars,12047,3150,15197,352.270347,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,build-pmars,352.270347,False,0.2,False,352.270347 +8b3a085b-2cbb-4ca2-b074-f1b6685c76f8,gpt-5,openai,fix-code-vulnerability,2674,1787,4461,1018.416899,False,0.0,gpt-5,fix-code-vulnerability,1018.416899,False,0.0,False,1018.416899 +0bdb0a70-c7f4-4cde-b07c-2daea4655a40,gpt-5,openai,pytorch-model-recovery,11540,9823,21363,904.457709,True,1.0,gpt-5,pytorch-model-recovery,904.457709,True,0.4285714285714285,True,904.457709 
+ceab9c91-1690-4a62-8f30-334eb48874d0,gemini-2.5-flash,gemini,winning-avg-corewars,18900,17935,36835,2630.333253,False,0.0,gemini-2.5-flash,winning-avg-corewars,2630.333253,False,0.0,False,2630.333253 +a83280f5-c068-456a-846a-06fc405c4110,claude-sonnet-4-20250514,anthropic,distribution-search,9264,8105,17369,554.83574,True,1.0,claude-sonnet-4-20250514,distribution-search,554.83574,True,0.6,True,554.83574 +2d148477-4c94-433f-acc4-13465f7906f0,grok-code-fast-1,xai,reshard-c4-data,5355,4084,9439,152.232057,False,0.0,grok-code-fast-1,reshard-c4-data,152.232057,False,0.0,False,152.232057 +e667f95a-a7d4-4822-a860-c719a3ad8e1d,gpt-5-mini,openai,qemu-startup,2587,3801,6388,437.319814,True,1.0,gpt-5-mini,qemu-startup,437.319814,True,0.8,True,437.319814 +ca3e0e83-4752-4c7c-8503-480d17fd56f6,gpt-5-nano,openai,train-fasttext,10778,15746,26524,3647.866614,False,0.0,gpt-5-nano,train-fasttext,3647.866614,False,0.0,False,3647.866614 +75d95b08-130a-4e4f-a448-07d75f0a19f6,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,distribution-search,11657,11468,23125,814.595259,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,distribution-search,814.595259,False,0.4,False,814.595259 +9eec53de-11ab-45ed-b74f-af37fde9e9fd,zai-org/GLM-4.5-Air-FP8,together_ai,code-from-image,7223,3626,10849,276.399463,True,1.0,zai-org/GLM-4.5-Air-FP8,code-from-image,276.399463,True,0.2,True,276.399463 +5271a0fb-d8d5-441d-9857-b2a21985fe9a,claude-sonnet-4-20250514,anthropic,dna-insert,4835,658,5493,502.79937,False,0.0,claude-sonnet-4-20250514,dna-insert,502.79937,False,0.0,False,502.79937 +1e2e71c0-1c83-46c4-88a9-59e58336cc96,OpenAI/gpt-oss-20B,together_ai,fix-git,1649,2039,3688,91.160401,True,1.0,OpenAI/gpt-oss-20B,fix-git,91.160401,True,0.2,True,91.160401 +dac4d51e-b35e-4398-99e6-6633dde32d0e,moonshotai/Kimi-K2-Instruct-0905,together_ai,regex-log,3351,2993,6344,303.677945,False,0.0,moonshotai/Kimi-K2-Instruct-0905,regex-log,303.677945,False,0.4,False,303.677945 
+ee5c1bc9-dde1-4c01-9f47-65674d197acc,zai-org/GLM-4.5-Air-FP8,together_ai,build-pmars,9880,6056,15936,439.080494,True,1.0,zai-org/GLM-4.5-Air-FP8,build-pmars,439.080494,True,0.6,True,439.080494 +2292ab98-2e7a-4557-a861-3a55dc2f308c,OpenAI/gpt-oss-20B,together_ai,cancel-async-tasks,1014,1358,2372,42.635609,False,0.0,OpenAI/gpt-oss-20B,cancel-async-tasks,42.635609,False,0.0,False,42.635609 +b3e1734d-044b-432b-b8ef-8cfcb4f2b212,gemini-2.5-flash,gemini,path-tracing-reverse,31086,24956,56042,1239.350293,False,0.0,gemini-2.5-flash,path-tracing-reverse,1239.350293,False,0.0,False,1239.350293 +df091b11-f901-4785-9e12-343f5885e082,grok-4-0709,xai,financial-document-processor,7335,2520,9855,496.659992,False,0.0,grok-4-0709,financial-document-processor,496.659992,False,0.0,False,496.659992 +f53e27a8-4827-418c-9499-f5fbf86990b8,grok-4-0709,xai,path-tracing,2059,1749,3808,2025.897205,False,0.0,grok-4-0709,path-tracing,2025.897205,False,0.0,False,2025.897205 +96844e5c-2ba0-4a39-a429-c059b6188e1d,gpt-5-mini,openai,run-pdp11-code,10134,5338,15472,1028.420196,False,0.0,gpt-5-mini,run-pdp11-code,1028.420196,False,0.0,False,1028.420196 +3c42443c-6c5c-4293-a265-8e3096636f2c,grok-4-0709,xai,pypi-server,2816,2076,4892,491.081837,True,1.0,grok-4-0709,pypi-server,491.081837,True,0.4,True,491.081837 +2d301cdc-1a07-4ded-9057-ee70e030663b,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,sqlite-db-truncate,2528,2123,4651,190.971173,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,sqlite-db-truncate,190.971173,False,0.0,False,190.971173 +5572e163-9e93-4bae-936f-cf990fd45e3a,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,qemu-alpine-ssh,1714,1235,2949,102.067955,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,qemu-alpine-ssh,102.067955,False,0.0,False,102.067955 
+03e0ce95-b78e-410e-a460-481644c3887a,claude-opus-4-1-20250805,anthropic,feal-linear-cryptanalysis,16767,23199,39966,1807.988643,False,0.0,claude-opus-4-1-20250805,feal-linear-cryptanalysis,1807.988643,False,0.0,False,1807.988643 +58cc0734-7551-4fbc-8ef3-acb1910588df,gemini-2.5-pro,gemini,db-wal-recovery,1775,3056,4831,900.031961,False,0.0,gemini-2.5-pro,db-wal-recovery,900.031961,False,0.0,False,900.031961 +5e7a9f58-deb8-4eee-bae4-40de303db202,moonshotai/Kimi-K2-Instruct-0905,together_ai,path-tracing-reverse,19532,6290,25822,1006.381626,False,0.0,moonshotai/Kimi-K2-Instruct-0905,path-tracing-reverse,1006.381626,False,0.0,False,1006.381626 +3d48106b-4428-4b61-8344-5cfbb1654b17,grok-code-fast-1,xai,hf-model-inference,3614,897,4511,85.622256,False,0.0,grok-code-fast-1,hf-model-inference,85.622256,False,0.4,False,85.622256 +25bcc30c-935b-4b86-afde-8f6751dfdaf1,grok-code-fast-1,xai,git-leak-recovery,1458,1217,2675,214.798702,False,0.0,grok-code-fast-1,git-leak-recovery,214.798702,False,0.2,False,214.798702 +26f30ad3-b0e4-4531-939c-1c03f9d6dcdc,claude-opus-4-1-20250805,anthropic,db-wal-recovery,11495,8843,20338,904.844732,False,0.0,claude-opus-4-1-20250805,db-wal-recovery,904.844732,False,0.0,False,904.844732 +577ae939-0eb6-4bcd-b343-fe80131ef274,gpt-5-nano,openai,build-pmars,19038,16679,35717,917.995153,False,0.0,gpt-5-nano,build-pmars,917.995153,False,0.0,False,917.995153 +2bb45cc0-f0fc-4aba-bd12-b45ca6148f38,gpt-5,openai,train-fasttext,14445,9756,24201,3615.256775,False,0.0,gpt-5,train-fasttext,3615.256775,False,0.0,False,3615.256775 +9854421f-bc1a-4372-85fb-60f5ebdfe4fd,moonshotai/Kimi-K2-Instruct-0905,together_ai,count-dataset-tokens,9639,3395,13034,322.131671,False,0.0,moonshotai/Kimi-K2-Instruct-0905,count-dataset-tokens,322.131671,False,0.2,False,322.131671 +b9dc9fdd-9255-4966-9a0a-bff97c3b2d59,openai/gpt-oss-120b,together_ai,git-leak-recovery,1474,1357,2831,196.66383,False,0.0,openai/gpt-oss-120b,git-leak-recovery,196.66383,False,0.2,False,196.66383 
+44a66d1e-0f6f-447f-a588-2a6cbf046105,gpt-5,openai,qemu-alpine-ssh,782,909,1691,999.167004,False,0.0,gpt-5,qemu-alpine-ssh,999.167004,False,0.1666666666666666,False,999.167004 +3a829fcb-6d95-440f-a000-9974dc4829f9,gpt-5-nano,openai,count-dataset-tokens,6503,6662,13165,907.80398,False,0.0,gpt-5-nano,count-dataset-tokens,907.80398,False,0.0,False,907.80398 +7242fe82-1dcb-4237-885d-e03b24c74654,gemini-2.5-flash,gemini,crack-7z-hash,10027,3878,13905,238.596896,True,1.0,gemini-2.5-flash,crack-7z-hash,238.596896,True,0.8,True,238.596896 +8562de32-7234-4140-bd24-bd6d836e7ab2,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,sanitize-git-repo,12321,3978,16299,924.262306,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,sanitize-git-repo,924.262306,False,0.0,False,924.262306 +9a8d8649-b56b-4fa3-b28b-00958cba7054,claude-sonnet-4-20250514,anthropic,install-klee-minimal,17356,2716,20072,900.070444,False,0.0,claude-sonnet-4-20250514,install-klee-minimal,900.070444,False,0.0,False,900.070444 +23a4a582-67c6-4159-883e-a943c3f75781,grok-4-0709,xai,openssl-selfsigned-cert,1821,1063,2884,200.871489,False,0.0,grok-4-0709,openssl-selfsigned-cert,200.871489,False,0.0,False,200.871489 +0c88fe40-f7c2-4887-8365-e1d1e04dc572,gemini-2.5-pro,gemini,fix-ocaml-gc,19465,6847,26312,1269.116548,True,1.0,gemini-2.5-pro,fix-ocaml-gc,1269.116548,True,0.2,True,1269.116548 +c0f03aa3-64b2-4172-bd3c-9018bd73faf9,deepseek-ai/DeepSeek-V3.1,together_ai,large-scale-text-editing,11453,10545,21998,1204.830639,False,0.0,deepseek-ai/DeepSeek-V3.1,large-scale-text-editing,1204.830639,False,0.0,False,1204.830639 +d2954d13-0729-4b1b-b746-c5e04668ebbe,gpt-5,openai,gpt2-codegolf,4226,5003,9229,906.57832,False,0.0,gpt-5,gpt2-codegolf,906.57832,False,0.0,False,906.57832 +d295bca6-dd0e-4cf3-893f-a7d8db6ef416,deepseek-ai/DeepSeek-V3.1,together_ai,reshard-c4-data,9399,4214,13613,800.145566,False,0.0,deepseek-ai/DeepSeek-V3.1,reshard-c4-data,800.145566,False,0.0,False,800.145566 
+6e012eb7-7a30-4e79-a408-0add1d7eb526,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,break-filter-js-from-html,5574,6373,11947,1203.661381,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,break-filter-js-from-html,1203.661381,False,0.0,False,1203.661381 +9cc9746f-d489-4cef-895b-fd574f6efe79,gpt-5-nano,openai,fix-ocaml-gc,14537,5267,19804,3754.157715,False,0.0,gpt-5-nano,fix-ocaml-gc,3754.157715,False,0.0,False,3754.157715 +e56b2f2e-27e6-4ffb-b1f5-30fe3491bd10,grok-4-0709,xai,form-filling,4521,3228,7749,470.98634,False,0.0,grok-4-0709,form-filling,470.98634,False,0.2,False,470.98634 +21a45437-c1e3-4b72-b6ba-c4cd2f458c19,deepseek-ai/DeepSeek-V3.1,together_ai,tune-mjcf,7326,5720,13046,1046.321196,False,0.0,deepseek-ai/DeepSeek-V3.1,tune-mjcf,1046.321196,False,0.0,False,1046.321196 +9cb6db34-45e0-46be-b714-9a1b092c6ac6,gpt-5-nano,openai,wasm-pipeline,8594,7312,15906,912.719245,False,0.0,gpt-5-nano,wasm-pipeline,912.719245,False,0.0,False,912.719245 +c28cdaed-8325-4300-a093-0ee1246bdeec,claude-opus-4-1-20250805,anthropic,gpt2-codegolf,16287,14934,31221,1116.660261,False,0.0,claude-opus-4-1-20250805,gpt2-codegolf,1116.660261,False,0.0,False,1116.660261 +c03593c0-988e-4682-a474-725c9690b785,gpt-5-mini,openai,hf-model-inference,4542,2359,6901,505.853509,True,1.0,gpt-5-mini,hf-model-inference,505.853509,True,0.8,True,505.853509 +57c092f6-9f79-45c6-a4a0-caa7c8e4657c,grok-code-fast-1,xai,port-compressor,19890,14154,34044,1707.588556,False,0.0,grok-code-fast-1,port-compressor,1707.588556,False,0.0,False,1707.588556 +702a4368-6487-486b-ad1c-75dbeec4e270,moonshotai/Kimi-K2-Instruct-0905,together_ai,install-klee-minimal,15981,3088,19069,902.115913,False,0.0,moonshotai/Kimi-K2-Instruct-0905,install-klee-minimal,902.115913,False,0.0,False,902.115913 +6f5eaaad-ff22-4b2b-9a0a-e77d647a8b29,claude-sonnet-4-20250514,anthropic,prove-plus-comm,2108,1667,3775,124.80742,True,1.0,claude-sonnet-4-20250514,prove-plus-comm,124.80742,True,1.0,True,124.80742 
+f7dffa74-2af0-4d70-8602-531047175d88,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,qemu-startup,5105,6661,11766,903.169268,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,qemu-startup,903.169268,False,0.0,False,903.169268 +e402da3a-9b92-434e-9998-c2e82ebb1611,grok-4-0709,xai,build-pmars,844,632,1476,2063.595934,False,0.0,grok-4-0709,build-pmars,2063.595934,False,0.2,False,2063.595934 +376a72cc-6c09-47c9-a9ec-e8317ea6b493,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,chess-best-move,5089,2837,7926,205.094775,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,chess-best-move,205.094775,False,0.0,False,205.094775 +1be10523-5c7d-4e16-8107-ea9159eaeadc,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,together_ai,vulnerable-secret,3172,3523,6695,142.002919,False,0.0,meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,vulnerable-secret,142.002919,False,0.0,False,142.002919 +7ff09eb3-af62-464f-971c-3fe7b1d141f4,gpt-5-mini,openai,build-pov-ray,6096,5605,11701,870.001616,False,0.0,gpt-5-mini,build-pov-ray,870.001616,False,0.0,False,870.001616 +b1dc7dfa-386d-41eb-b055-63d6479b5d81,gpt-5-mini,openai,build-pmars,12559,10445,23004,948.159392,False,0.0,gpt-5-mini,build-pmars,948.159392,False,0.2,False,948.159392 +bffcb8b2-e1a3-4c0e-85ef-ed3107738cb0,gpt-5-nano,openai,git-leak-recovery,7291,6194,13485,601.066027,False,0.0,gpt-5-nano,git-leak-recovery,601.066027,False,0.0,False,601.066027 +7a4207b9-7cea-453d-92db-0a29babefa85,gpt-5-mini,openai,circuit-fibsqrt,1994,2096,4090,109.78106,False,0.0,gpt-5-mini,circuit-fibsqrt,109.78106,False,0.0,False,109.78106 +66bfefa1-69b8-4e3f-9ee1-a37207314321,deepseek-ai/DeepSeek-V3.1,together_ai,build-pov-ray,17741,5396,23137,483.486725,True,1.0,deepseek-ai/DeepSeek-V3.1,build-pov-ray,483.486725,True,0.4,True,483.486725 
+eadaa92e-92a2-4996-a15c-73d13b62624a,deepseek-ai/DeepSeek-V3.1,together_ai,qemu-alpine-ssh,2132,2365,4497,323.904361,False,0.0,deepseek-ai/DeepSeek-V3.1,qemu-alpine-ssh,323.904361,False,0.2,False,323.904361 +a8031f57-d582-45fb-8d75-88d73aeddbd8,gemini-2.5-pro,gemini,write-compressor,5923,6326,12249,904.423041,False,0.0,gemini-2.5-pro,write-compressor,904.423041,False,0.0,False,904.423041 +a676c26e-9136-409d-90ad-eed7566362db,moonshotai/Kimi-K2-Instruct-0905,together_ai,pypi-server,14235,5985,20220,761.406198,False,0.0,moonshotai/Kimi-K2-Instruct-0905,pypi-server,761.406198,False,0.2,False,761.406198 +dc0a9d42-a91d-4aa0-b2f2-77ae7469bc84,openai/gpt-oss-120b,together_ai,password-recovery,2054,5499,7553,409.378542,False,0.0,openai/gpt-oss-120b,password-recovery,409.378542,False,0.2,False,409.378542 +6052188c-823a-48ef-a026-17a9b0918138,zai-org/GLM-4.5-Air-FP8,together_ai,extract-elf,6080,2593,8673,375.939295,False,0.0,zai-org/GLM-4.5-Air-FP8,extract-elf,375.939295,False,0.4,False,375.939295 +e8444f28-f310-4040-9cb2-c61d2b17f419,grok-4-0709,xai,sqlite-db-truncate,1797,1269,3066,909.078122,False,0.0,grok-4-0709,sqlite-db-truncate,909.078122,False,0.0,False,909.078122 +7f58e472-5978-450a-b836-97b96ec69a30,OpenAI/gpt-oss-20B,together_ai,distribution-search,811,1738,2549,119.747625,False,0.0,OpenAI/gpt-oss-20B,distribution-search,119.747625,False,0.0,False,119.747625 +7f5a9e0f-6988-4683-bb2f-331b783fa8b9,deepseek-ai/DeepSeek-V3.1,together_ai,break-filter-js-from-html,3093,3351,6444,386.618178,False,0.0,deepseek-ai/DeepSeek-V3.1,break-filter-js-from-html,386.618178,False,0.0,False,386.618178 +b4ccc014-d359-43a0-bcfb-87db022f74d2,grok-code-fast-1,xai,qemu-alpine-ssh,1731,1238,2969,224.318987,False,0.0,grok-code-fast-1,qemu-alpine-ssh,224.318987,False,0.0,False,224.318987 
+64c01cb1-74ce-4008-95e5-add099ff32d7,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,together_ai,code-from-image,13955,12085,26040,820.332866,False,0.0,Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,code-from-image,820.332866,False,0.2,False,820.332866 +35cf8209-eb58-483f-8dd5-c34a435cfeb0,openai/gpt-oss-120b,together_ai,build-cython-ext,12414,4385,16799,900.36206,False,0.0,openai/gpt-oss-120b,build-cython-ext,900.36206,False,0.0,False,900.36206 +4e9b5541-ab60-48df-a4ad-b1ad4daa74cb,OpenAI/gpt-oss-20B,together_ai,sqlite-db-truncate,257,1040,1297,140.089677,False,0.0,OpenAI/gpt-oss-20B,sqlite-db-truncate,140.089677,False,0.0,False,140.089677 +97b9c356-a088-49e4-8679-f381cf237400,gpt-5-nano,openai,sanitize-git-repo,19670,11606,31276,908.925051,False,0.0,gpt-5-nano,sanitize-git-repo,908.925051,False,0.0,False,908.925051 +0d745d79-1273-4963-820f-c40cec623d83,moonshotai/Kimi-K2-Instruct-0905,together_ai,path-tracing,5951,5806,11757,2035.562264,False,0.0,moonshotai/Kimi-K2-Instruct-0905,path-tracing,2035.562264,False,0.0,False,2035.562264 diff --git a/notebooks/total_avg_episodes_pipeline/results/model_total_statistics.csv b/notebooks/total_avg_episodes_pipeline/results/model_total_statistics.csv new file mode 100644 index 0000000..d379adf --- /dev/null +++ b/notebooks/total_avg_episodes_pipeline/results/model_total_statistics.csv @@ -0,0 +1,17 @@ +model_name,total_episodes,total_trials,successful_trials,success_rate +gpt-5,3102,444,152,0.34234234234234234 +claude-opus-4-1-20250805,11468,581,194,0.33390705679862304 +claude-sonnet-4-20250514,10346,368,108,0.29347826086956524 +gemini-2.5-pro,4995,369,100,0.27100271002710025 +deepseek-ai/DeepSeek-V3.1,8948,369,83,0.22493224932249323 +moonshotai/Kimi-K2-Instruct-0905,11594,373,80,0.21447721179624665 +grok-4-0709,3156,369,76,0.20596205962059622 +gpt-5-mini,2688,367,75,0.20435967302452315 +Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8,12467,373,68,0.18230563002680966 +openai/gpt-oss-120b,4169,365,54,0.14794520547945206 
+zai-org/GLM-4.5-Air-FP8,10263,371,52,0.14016172506738545 +grok-code-fast-1,2646,371,49,0.1320754716981132 +gemini-2.5-flash,5992,371,44,0.11859838274932614 +gpt-5-nano,5114,369,33,0.08943089430894309 +meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8,4709,369,24,0.06504065040650407 +OpenAI/gpt-oss-20B,8250,370,8,0.021621621621621623 diff --git a/notebooks/total_avg_episodes_pipeline/results/total_avg_episodes_vs_success.pdf b/notebooks/total_avg_episodes_pipeline/results/total_avg_episodes_vs_success.pdf new file mode 100644 index 0000000..5ad3743 Binary files /dev/null and b/notebooks/total_avg_episodes_pipeline/results/total_avg_episodes_vs_success.pdf differ diff --git a/notebooks/total_avg_episodes_pipeline/results/total_avg_episodes_vs_success.png b/notebooks/total_avg_episodes_pipeline/results/total_avg_episodes_vs_success.png new file mode 100644 index 0000000..61725fa Binary files /dev/null and b/notebooks/total_avg_episodes_pipeline/results/total_avg_episodes_vs_success.png differ diff --git a/notebooks/total_avg_episodes_pipeline/total_avg_episodes_analysis.ipynb b/notebooks/total_avg_episodes_pipeline/total_avg_episodes_analysis.ipynb new file mode 100644 index 0000000..397ce91 --- /dev/null +++ b/notebooks/total_avg_episodes_pipeline/total_avg_episodes_analysis.ipynb @@ -0,0 +1,252 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Success vs. Total Average Episodes" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "For each model across ALL tasks and trials:\n", + "\n", + "1. TOTAL AVERAGE EPISODES:\n", + " - Total episodes = sum of all episode counts across all trials for that model\n", + " - Total trials = count of all trials for that model \n", + " - Total avg episodes = total episodes / total trials\n", + " \n", + " This gives us the average number of episodes a model needs per trial,\n", + " aggregated across all tasks it attempted.\n", + "\n", + "2. 
SUCCESS RATE:\n", + " - Successful trials = count of trials where reward = 1\n", + " - Success rate = successful trials / total trials\n", + " \n", + " This gives us the proportion of trials where the model succeeded." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd\n", + "import numpy as np\n", + "import matplotlib.pyplot as plt\n", + "import json\n", + "from pathlib import Path\n", + "from scipy import stats\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def load_episode_data():\n", + " # TODO: Set path to your terminus2 data directory (output from get_terminus2_runs.py)\n", + " episode_file = Path(\"../../../terminus2_9-17_essential_files/episode_counts.json\")\n", + " \n", + " with open(episode_file, 'r') as f:\n", + " episode_data = json.load(f)\n", + " \n", + " df = pd.DataFrame(episode_data)\n", + " \n", + " required_columns = ['trial_id', 'episode_count', 'model_name', 'task_name', 'reward']\n", + " df = df[df[required_columns].notna().all(axis=1)].copy()\n", + " df = df[df['episode_count'] >= 0].copy()\n", + " \n", + " return df\n", + "\n", + "df = load_episode_data()\n", + "print(f\"Loaded {len(df)} valid trials\")\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def calculate_model_statistics(df):\n", + " model_stats = []\n", + " \n", + " for model_name in df['model_name'].unique():\n", + " model_data = df[df['model_name'] == model_name]\n", + " \n", + " total_episodes = model_data['episode_count'].sum()\n", + " total_trials = len(model_data)\n", + " successful_trials = len(model_data[model_data['reward'] == 1])\n", + " success_rate = successful_trials / total_trials if total_trials > 0 else 0\n", + " \n", + " model_stats.append({\n", + " 'model_name': model_name,\n", + " 'total_episodes': total_episodes,\n", + " 'total_trials': 
total_trials,\n", + " 'successful_trials': successful_trials,\n", + " 'success_rate': success_rate\n", + " })\n", + " \n", + " stats_df = pd.DataFrame(model_stats)\n", + " stats_df = stats_df.sort_values('success_rate', ascending=False)\n", + " \n", + " return stats_df\n", + "\n", + "stats_df = calculate_model_statistics(df)\n", + "display(stats_df.head(10))\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def simplify_model_name(model_name):\n", + " model_names = {\n", + " \"claude-sonnet-4-20250514\": \"Claude Sonnet 4\",\n", + " \"claude-opus-4-1-20250805\": \"Claude Opus 4.1\",\n", + " \"gpt-5\": \"GPT-5\",\n", + " \"gpt-5-mini\": \"GPT-5-Mini\",\n", + " \"gpt-5-nano\": \"GPT-5-Nano\",\n", + " \"grok-4-0709\": \"Grok 4\",\n", + " \"grok-code-fast-1\": \"Grok Code Fast 1\",\n", + " \"gemini-2.5-pro\": \"Gemini 2.5 Pro\",\n", + " \"gemini-2.5-flash\": \"Gemini 2.5 Flash\",\n", + " \"Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8\": \"Qwen 3 Coder 480B\",\n", + " \"openai/gpt-oss-120b\": \"GPT-OSS 120B\",\n", + " \"OpenAI/gpt-oss-20B\": \"GPT-OSS 20B\",\n", + " \"moonshotai/Kimi-K2-Instruct-0905\": \"Kimi K2\",\n", + " \"meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8\": \"Llama 4 Maverick 17B\",\n", + " \"zai-org/GLM-4.5-Air-FP8\": \"GLM 4.5 Air\",\n", + " \"deepseek-ai/DeepSeek-V3.1\": \"DeepSeek V3.1\",\n", + " }\n", + " return model_names.get(model_name, model_name)\n", + "\n", + "def extract_provider_from_model(model_name):\n", + " if 'claude' in model_name.lower():\n", + " return 'Anthropic'\n", + " elif 'gpt' in model_name.lower() or 'openai' in model_name.lower():\n", + " return 'OpenAI'\n", + " elif 'gemini' in model_name.lower():\n", + " return 'Google'\n", + " elif 'deepseek' in model_name.lower():\n", + " return 'DeepSeek'\n", + " elif 'kimi' in model_name.lower() or 'moonshot' in model_name.lower():\n", + " return 'Moonshot'\n", + " elif 'qwen' in model_name.lower():\n", + " return 
'Alibaba'\n", + " elif 'grok' in model_name.lower():\n", + " return 'xAI'\n", + " elif 'glm' in model_name.lower() or 'zai-org' in model_name.lower():\n", + " return 'Zhipu'\n", + " elif 'llama' in model_name.lower() or 'meta' in model_name.lower():\n", + " return 'Meta'\n", + " else:\n", + " return 'Other'\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def create_scatter_plot(stats_df):\n", + " fig, ax = plt.subplots(figsize=(14, 10))\n", + " \n", + " stats_df = stats_df.copy()\n", + " stats_df['provider'] = stats_df['model_name'].apply(extract_provider_from_model)\n", + " \n", + " provider_colors = {\n", + " 'OpenAI': '#d62728',\n", + " 'Anthropic': '#2ca02c',\n", + " 'Google': '#ff7f0e',\n", + " 'xAI': '#bcbd22',\n", + " 'DeepSeek': '#9467bd',\n", + " 'Meta': '#8c564b',\n", + " 'Moonshot': '#e377c2',\n", + " 'Alibaba': '#7f7f7f',\n", + " 'Zhipu': '#17becf',\n", + " 'Other': '#1f77b4'\n", + " }\n", + " \n", + " stats_df['total_avg_episodes'] = stats_df['total_episodes'] / stats_df['total_trials']\n", + " \n", + " for provider in stats_df['provider'].unique():\n", + " provider_data = stats_df[stats_df['provider'] == provider]\n", + " ax.scatter(provider_data['total_avg_episodes'], provider_data['success_rate'],\n", + " c=provider_colors.get(provider, '#95A5A6'), \n", + " label=provider, s=100, alpha=0.7, edgecolors='black', linewidth=1)\n", + " \n", + " x = stats_df['total_avg_episodes']\n", + " y = stats_df['success_rate']\n", + " \n", + " correlation, p_value = stats.pearsonr(x, y)\n", + " \n", + " z = np.polyfit(x, y, 1)\n", + " p = np.poly1d(z)\n", + " ax.plot(x, p(x), \"r--\", alpha=0.8, linewidth=2, \n", + " label=f'Trend Line (r={correlation:.3f}, p={p_value:.3f})')\n", + " \n", + " for _, row in stats_df.iterrows():\n", + " display_name = simplify_model_name(row['model_name'])\n", + " x_pos = row['total_avg_episodes']\n", + " y_pos = row['success_rate']\n", + " \n", + " base_offset = 
(-8, 0)\n", + " if display_name == 'Grok 4':\n", + " base_offset = (8, 8)\n", + " \n", + " ha = 'right' if base_offset[0] < 0 else 'left'\n", + " \n", + " ax.annotate(display_name, \n", + " (x_pos, y_pos),\n", + " xytext=base_offset, textcoords='offset points',\n", + " fontsize=10, ha=ha, va='center')\n", + " \n", + " ax.set_xlabel('Total Average Episodes', fontsize=12, fontweight='bold')\n", + " ax.set_ylabel('Success Rate', fontsize=12, fontweight='bold')\n", + " ax.set_title('Total Average Episodes vs Success Rate', fontsize=14, fontweight='bold')\n", + " \n", + " ax.yaxis.set_major_formatter(plt.FuncFormatter(lambda y, _: f'{y:.2f}'))\n", + " ax.grid(True, alpha=0.3)\n", + " ax.set_xlim(left=0)\n", + " ax.set_ylim(bottom=0, top=max(stats_df['success_rate']) * 1.1)\n", + " ax.legend(bbox_to_anchor=(1.05, 1), loc='upper left')\n", + " \n", + " plt.tight_layout()\n", + " plt.savefig('total_avg_episodes_vs_success.png', dpi=300, bbox_inches='tight')\n", + " plt.savefig('total_avg_episodes_vs_success.pdf', dpi=300, bbox_inches='tight')\n", + " plt.show()\n", + " \n", + " return correlation, p_value\n", + "\n", + "correlation, p_value = create_scatter_plot(stats_df)\n", + "print(f\"Correlation: {correlation:.3f}, p-value: {p_value:.3f}\")\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "stats_df.to_csv('model_total_statistics.csv', index=False)\n", + "print(f\"Saved statistics for {len(stats_df)} models\")\n" + ] + } + ], + "metadata": { + "language_info": { + "name": "python" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/scripts/get_terminus2_runs.py b/scripts/get_terminus2_runs.py new file mode 100644 index 0000000..f120e6f --- /dev/null +++ b/scripts/get_terminus2_runs.py @@ -0,0 +1,147 @@ +#!/usr/bin/env python3 +""" +Simple script to download essential files and get episode counts for terminus-2 trials. 
import os
import json
import time
from pathlib import Path
from dotenv import load_dotenv
from supabase import create_client

load_dotenv()

# Essential per-trial artifacts, as (path inside the trial's storage folder,
# local filename). Shared by process_trial() and main() so the "all files
# downloaded" check cannot drift from the actual download list.
ESSENTIAL_FILES = (
    ("config.json", "config.json"),
    ("result.json", "result.json"),
    ("agent/recording.cast", "recording.cast"),
)


def download_file(client, trial_id, file_path, output_path):
    """Download a single file from Supabase storage.

    Fetches ``{trial_id}/{file_path}`` from the ``trials`` bucket and writes
    the returned bytes to ``output_path``.

    Returns:
        True if the file was downloaded and written, False if any error
        occurred (best-effort: the error is not propagated).
    """
    try:
        response = client.storage.from_("trials").download(f"{trial_id}/{file_path}")
        with open(output_path, 'wb') as f:
            f.write(response)
        return True
    except Exception:
        # Deliberately best-effort, but do not trap KeyboardInterrupt /
        # SystemExit the way a bare ``except:`` would.
        return False


def count_episodes(client, trial_id):
    """Count episodes by listing directories in Supabase storage.

    Lists ``{trial_id}/agent`` in the ``trials`` bucket and counts the entries
    whose name starts with ``episode-``.

    Returns:
        The number of matching entries, 0 if the listing is empty, or -1 if
        the listing request raised an error.
    """
    try:
        response = client.storage.from_("trials").list(f"{trial_id}/agent")
        if response:
            return len([item for item in response if item.get('name', '').startswith('episode-')])
        return 0
    except Exception:
        # -1 is the sentinel callers test for with ``episode_count >= 0``.
        return -1


def process_trial(client, trial, output_dir):
    """Download essential files and get episode count for one trial.

    Creates ``output_dir / trial["id"]``, downloads every entry of
    ESSENTIAL_FILES into it, and writes ``episode_count.txt`` when the episode
    count could be determined.

    Returns:
        A tuple ``(downloaded, episode_count, trial_data)`` where
        ``downloaded`` is the number of files fetched successfully,
        ``episode_count`` is the raw result of count_episodes() (-1 on
        failure), and ``trial_data`` is a JSON-serialisable dict of trial
        metadata in which a failed episode count is stored as None.
    """
    trial_id = trial["id"]
    trial_dir = output_dir / trial_id
    trial_dir.mkdir(parents=True, exist_ok=True)

    # Download essential files
    downloaded = 0
    for supabase_path, local_filename in ESSENTIAL_FILES:
        output_path = trial_dir / local_filename
        if download_file(client, trial_id, supabase_path, output_path):
            downloaded += 1

    # Get episode count
    episode_count = count_episodes(client, trial_id)

    # Save episode count to file
    if episode_count >= 0:
        with open(trial_dir / "episode_count.txt", 'w') as f:
            f.write(f"{episode_count}\n")

    # Extract trial metadata for JSON; a missing or null value falls back to
    # the same defaults as before ("Unknown" model, reward 0).
    trial_model = trial.get("trial_model") or {}
    model_name = trial_model.get("model_name", "Unknown")

    verifier_result = trial.get("verifier_result") or {}
    reward = verifier_result.get("reward", 0) if isinstance(verifier_result, dict) else 0

    trial_data = {
        "trial_id": trial_id,
        "trial_name": trial.get("trial_name", "Unknown"),
        "agent_name": trial.get("agent_name", "Unknown"),
        "agent_version": trial.get("agent_version", "Unknown"),
        "created_at": trial.get("created_at", "Unknown"),
        "task_name": trial.get("task_name", "Unknown"),
        "model_name": model_name,
        "reward": reward,
        "episode_count": episode_count if episode_count >= 0 else None
    }

    return downloaded, episode_count, trial_data


def _fetch_all_trials(client, batch_size=1000):
    """Return every matching terminus-2 trial row, fetched page by page."""
    all_trials = []
    offset = 0

    while True:
        response = (
            client.table("trial")
            .select("*, task!inner(*, dataset_task!inner(*)), trial_model!inner(*)")
            .or_("exception_info.is.null,exception_info->>exception_type.eq.AgentTimeoutError")
            .eq("task.dataset_task.dataset_name", "terminal-bench")
            .eq("task.dataset_task.dataset_version", "2.0")
            .eq("agent_name", "terminus-2")
            .gte("created_at", "2025-09-17T01:13:33.950824+00:00")
            # Range pagination is only stable with an explicit ordering;
            # without it pages may overlap or skip rows.
            # NOTE(review): assumes trial.id is unique - confirm.
            .order("id")
            .range(offset, offset + batch_size - 1)
            .execute()
        )

        batch_trials = response.data
        if not batch_trials:
            break

        all_trials.extend(batch_trials)

        # A short page means this was the last one.
        if len(batch_trials) < batch_size:
            break

        offset += batch_size

    return all_trials


def main():
    """Fetch all matching trials, download their files and write episode_counts.json."""
    client = create_client(
        supabase_url=os.environ["SUPABASE_URL"],
        supabase_key=os.environ["SUPABASE_PUBLISHABLE_KEY"],
    )

    # TODO: Set output directory path for downloaded files
    output_dir = Path(__file__).parent.parent.parent / "terminus2_9-17_essential_files"
    output_dir.mkdir(parents=True, exist_ok=True)

    all_trials = _fetch_all_trials(client)

    if not all_trials:
        print("No matching trials found")
        return

    success_count = 0
    total_files = 0
    all_trial_data = []

    for trial in all_trials:
        downloaded, episode_count, trial_data = process_trial(client, trial, output_dir)
        total_files += downloaded
        all_trial_data.append(trial_data)

        # A trial counts as successful only if every essential file was
        # fetched and the episode listing worked.
        if downloaded == len(ESSENTIAL_FILES) and episode_count >= 0:
            success_count += 1

        # Brief pause between trials (presumably to go easy on the API).
        time.sleep(0.1)

    # Save episode counts JSON
    json_file = output_dir / "episode_counts.json"
    with open(json_file, 'w') as f:
        json.dump(all_trial_data, f, indent=2)

    print(f"Processed {len(all_trials)} trials, {success_count} successful, {total_files} files downloaded")


if __name__ == "__main__":
    main()