Commit 2d4ad05
File tree
- runs
- DRIFT
- gemini-2.5-pro
- dailylife
- user_task_0
- important_instructions
- none
- user_task_10
- important_instructions
- none
- user_task_11
- important_instructions
- none
- user_task_12
- important_instructions
- none
- user_task_13
- important_instructions
- none
- user_task_14
- important_instructions
- none
- user_task_15
- important_instructions
- none
- user_task_16
- important_instructions
- none
- user_task_17
- important_instructions
- none
- user_task_18
- important_instructions
- none
- user_task_19
- important_instructions
- none
- user_task_1
- important_instructions
- none
- user_task_2
- important_instructions
- none
- user_task_3
- important_instructions
- none
- user_task_4
- important_instructions
- none
- user_task_5
- important_instructions
- none
- user_task_6
- important_instructions
- none
- user_task_7
- important_instructions
- none
- user_task_8
- important_instructions
- none
- user_task_9
- important_instructions
- none
- github
- user_task_0
- important_instructions
- none
- user_task_10
- important_instructions
- none
- user_task_11
- important_instructions
- none
- user_task_12
- important_instructions
- none
- user_task_13
- important_instructions
- none
- user_task_14
- important_instructions
- none
- user_task_15
- important_instructions
- none
- user_task_16
- important_instructions
- none
- user_task_17
- important_instructions
- none
- user_task_18
- important_instructions
- none
- user_task_19
- important_instructions
- none
- user_task_1
- important_instructions
- none
- user_task_2
- important_instructions
- none
- user_task_3
- important_instructions
- none
- user_task_4
- important_instructions
- none
- user_task_5
- important_instructions
- none
- user_task_6
- important_instructions
- none
- user_task_7
- important_instructions
- none
- user_task_8
- important_instructions
- none
- user_task_9
- important_instructions
- none
- shopping
- user_task_0
- important_instructions
- none
- user_task_10
- important_instructions
- none
- user_task_11
- important_instructions
- none
- user_task_12
- important_instructions
- none
- user_task_13
- important_instructions
- none
- user_task_14
- important_instructions
- none
- user_task_15
- important_instructions
- none
- user_task_16
- important_instructions
- none
- user_task_17
- important_instructions
- none
- user_task_18
- important_instructions
- none
- user_task_19
- important_instructions
- none
- user_task_1
- important_instructions
- none
- user_task_2
- important_instructions
- none
- user_task_3
- important_instructions
- none
- user_task_4
- important_instructions
- none
- user_task_5
- important_instructions
- none
- user_task_6
- important_instructions
- none
- user_task_7
- important_instructions
- none
- user_task_8
- important_instructions
- none
- user_task_9
- important_instructions
- none
- google/gemini-2.5-flash
- dailylife
- user_task_0
- important_instructions
- none
- user_task_10
- important_instructions
- none
- user_task_11
- important_instructions
- none
- user_task_12
- important_instructions
- none
- user_task_13
- important_instructions
- none
- user_task_14
- important_instructions
- none
- user_task_15
- important_instructions
- none
- user_task_16
- important_instructions
- none
- user_task_17
- important_instructions
- none
- user_task_18
- important_instructions
- none
- user_task_19
- important_instructions
- none
- user_task_1
- important_instructions
- none
- user_task_2
- important_instructions
- none
- user_task_3
- important_instructions
- none
- user_task_4
- important_instructions
- none
- user_task_5
- important_instructions
- none
- user_task_6
- important_instructions
- none
- user_task_7
- important_instructions
- none
- user_task_8
- important_instructions
- none
- user_task_9
- important_instructions
- none
- github
- user_task_0
- important_instructions
- none
- user_task_10
- important_instructions
- none
- user_task_11
- important_instructions
- none
- user_task_12
- important_instructions
- none
- user_task_13
- important_instructions
- none
- user_task_14
- important_instructions
- none
- user_task_15
- important_instructions
- none
- user_task_16
- important_instructions
- none
- user_task_17
- important_instructions
- none
- user_task_18
- important_instructions
- none
- user_task_19
- important_instructions
- none
- user_task_1
- important_instructions
- none
- user_task_2
- important_instructions
- none
- user_task_3
- important_instructions
- none
- user_task_4
- important_instructions
- none
- user_task_5
- important_instructions
- none
- user_task_6
- important_instructions
- none
- user_task_7
- important_instructions
- none
- user_task_8
- important_instructions
- none
- user_task_9
- important_instructions
- none
- shopping
- user_task_0
- important_instructions
- none
- user_task_10
- important_instructions
- none
- user_task_11
- important_instructions
- none
- user_task_12
- important_instructions
- none
- user_task_13
- important_instructions
- none
- user_task_14
- important_instructions
- none
- user_task_15
- important_instructions
- none
- user_task_16
- important_instructions
- none
- user_task_17
- important_instructions
- none
- user_task_18
- important_instructions
- none
- user_task_19
- important_instructions
- none
- user_task_1
- important_instructions
- none
- user_task_2
- important_instructions
- none
- user_task_3
- important_instructions
- none
- user_task_4
- important_instructions
- none
- user_task_5
- important_instructions
- none
- user_task_6
- important_instructions
- none
- user_task_7
- important_instructions
- none
- user_task_8
- important_instructions
- none
- user_task_9
- important_instructions
- none
- gpt-4o-2024-08-06
- dailylife
- user_task_0
- important_instructions
- none
- user_task_10
- important_instructions
- none
- user_task_11
- important_instructions
- none
- user_task_12
- important_instructions
- none
- user_task_13
- important_instructions
- none
- user_task_14
- important_instructions
- none
- user_task_15
- important_instructions
- none
- user_task_16
- important_instructions
- none
- user_task_17
- important_instructions
- none
- user_task_18
- important_instructions
- none
- user_task_19
- important_instructions
- none
- user_task_1
- important_instructions
- none
- user_task_2
- important_instructions
- none
- user_task_3
- important_instructions
- none
- user_task_4
- important_instructions
- none
- user_task_5
- important_instructions
- none
- user_task_6
- important_instructions
- none
- user_task_7
- important_instructions
- none
- user_task_8
- important_instructions
- none
- user_task_9
- important_instructions
- none
- github
- user_task_0
- important_instructions
- none
- user_task_10
- important_instructions
- none
- user_task_11
- important_instructions
- none
- user_task_12
- important_instructions
- none
- user_task_13
- important_instructions
- none
- user_task_14
- important_instructions
- none
- user_task_15
- important_instructions
- none
- user_task_16
- important_instructions
- none
- user_task_17
- important_instructions
- none
- user_task_18
- important_instructions
- none
- user_task_19
- important_instructions
- none
- user_task_1
- important_instructions
- none
- user_task_2
- important_instructions
- none
- user_task_3
- important_instructions
- none
- user_task_4
- important_instructions
- none
- user_task_5
- important_instructions
- none
- user_task_6
- important_instructions
- none
- user_task_7
- important_instructions
- none
- user_task_8
- important_instructions
- none
- user_task_9
- important_instructions
- none
- shopping
- user_task_0
- important_instructions
- none
- user_task_10
- important_instructions
- none
- user_task_11
- important_instructions
- none
- user_task_12
- important_instructions
- none
- user_task_13
- important_instructions
- none
- user_task_14
- important_instructions
- none
- user_task_15
- important_instructions
- none
- user_task_16
- important_instructions
- none
- user_task_17
- important_instructions
- none
- user_task_18
- important_instructions
- none
- user_task_19
- important_instructions
- none
- user_task_1
- important_instructions
- none
- user_task_2
- important_instructions
- none
- user_task_3
- important_instructions
- none
- user_task_4
- important_instructions
- none
- user_task_5
- important_instructions
- none
- user_task_6
- important_instructions
- none
- user_task_7
- important_instructions
- none
- user_task_8
- important_instructions
- none
- user_task_9
- important_instructions
- none
- gpt-4o-mini-2024-07-18
- dailylife
- user_task_0
- important_instructions
- none
- user_task_10
- important_instructions
- none
- user_task_11
- important_instructions
- none
- user_task_12
- important_instructions
- none
- user_task_13
- important_instructions
- none
- user_task_14
- important_instructions
- none
- user_task_15
- important_instructions
- none
- user_task_16
- important_instructions
- none
- user_task_17
- important_instructions
- none
- user_task_18
- important_instructions
- none
- user_task_19
- important_instructions
- none
- user_task_1
- important_instructions
- none
- user_task_2
- important_instructions
- none
- user_task_3
- important_instructions
- none
- user_task_4
- important_instructions
- none
- user_task_5
- important_instructions
- none
- user_task_6
- important_instructions
- none
- user_task_7
- important_instructions
- none
- user_task_8
- important_instructions
- none
- user_task_9
- important_instructions
- none
- github
- user_task_0
- important_instructions
- none
- user_task_10
- important_instructions
- none
- user_task_11
- important_instructions
- none
- user_task_12
- important_instructions
- none
- user_task_13
- important_instructions
- none
- user_task_14
- important_instructions
- none
- user_task_15
- important_instructions
- none
- user_task_16
- important_instructions
- none
- user_task_17
- important_instructions
- none
- user_task_18
- important_instructions
- none
- user_task_19
- important_instructions
- none
- user_task_1
- important_instructions
- none
- user_task_2
- important_instructions
- none
- user_task_3
- important_instructions
- none
- user_task_4
- important_instructions
- none
- user_task_5
- important_instructions
- none
- user_task_6
- important_instructions
- none
- user_task_7
- important_instructions
- none
- user_task_8
- important_instructions
- none
- user_task_9
- important_instructions
- none
- shopping
- user_task_0
- important_instructions
- none
- user_task_10
- important_instructions
- none
- user_task_11
- important_instructions
- none
- user_task_12
- important_instructions
- none
- user_task_13
- important_instructions
- none
- user_task_14
- important_instructions
- none
- user_task_15
- important_instructions
- none
- user_task_16
- important_instructions
- none
- user_task_17
- important_instructions
- none
- user_task_18
- important_instructions
- none
- user_task_19
- important_instructions
- none
- user_task_1
- important_instructions
- none
- user_task_2
- important_instructions
- none
- user_task_3
- important_instructions
- none
- user_task_4
- important_instructions
- none
- user_task_5
- important_instructions
- none
- user_task_6
- important_instructions
- none
- user_task_7
- important_instructions
- none
- user_task_8
- important_instructions
- none
- user_task_9
- important_instructions
- none
- gpt-5-mini-2025-08-07
- dailylife
- user_task_0
- important_instructions
- none
- user_task_10
- important_instructions
- none
- user_task_11
- important_instructions
- none
- user_task_12
- important_instructions
- none
- user_task_13
- important_instructions
- none
- user_task_14
- important_instructions
- none
- user_task_15
- important_instructions
- none
- user_task_16
- important_instructions
- none
- user_task_17
- important_instructions
- none
- user_task_18
- important_instructions
- none
- user_task_19
- important_instructions
- none
- user_task_1
- important_instructions
- none
- user_task_2
- important_instructions
- none
- user_task_3
- important_instructions
- none
- user_task_4
- important_instructions
- none
- user_task_5
- important_instructions
- none
- user_task_6
- important_instructions
- none
- user_task_7
- important_instructions
- none
- user_task_8
- important_instructions
- none
- user_task_9
- important_instructions
- none
- github
- user_task_0
- important_instructions
- none
- user_task_10
- important_instructions
- none
- user_task_11
- important_instructions
- none
- user_task_12
- important_instructions
- none
- user_task_13
- important_instructions
- none
- user_task_14
- important_instructions
- none
- user_task_15
- important_instructions
- none
- user_task_16
- important_instructions
- none
- user_task_17
- important_instructions
- none
- user_task_18
- important_instructions
- none
- user_task_19
- important_instructions
- none
- user_task_1
- important_instructions
- none
- user_task_2
- important_instructions
- none
- user_task_3
- important_instructions
- none
- user_task_4
- important_instructions
- none
- user_task_5
- important_instructions
- none
- user_task_6
- important_instructions
- none
- user_task_7
- important_instructions
- none
- user_task_8
- important_instructions
- none
- user_task_9
- important_instructions
- none
- shopping
- user_task_0
- important_instructions
- none
- user_task_10
- important_instructions
- none
- user_task_11
- important_instructions
- none
- user_task_12
- important_instructions
- none
- user_task_13
- important_instructions
- none
- user_task_14
- important_instructions
- none
- user_task_15
- important_instructions
- none
- user_task_16
- important_instructions
- none
- user_task_17/important_instructions
- user_task_1
- important_instructions
- none
Some content is hidden
Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.
Binary file not shown.
Lines changed: 0 additions & 280 deletions
This file was deleted.
0 commit comments