Skip to content
Merged
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 4 additions & 0 deletions src/pg2_benchmark/dummy_data.py
Original file line number Diff line number Diff line change
Expand Up @@ -113,6 +113,10 @@ def charge_ladder_dataset(n_rows: int = 200, seq_len: int = 20) -> pd.DataFrame:
sequences = [
charge_mutations(parent, random.randint(0, seq_len)) for _ in range(n_rows)
]

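# Deduplicate sequences (note: set() does not preserve generation order, and the result may contain fewer than n_rows rows)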
sequences = list(set(sequences))

Comment thread
tintinrevient marked this conversation as resolved.
charge = [peptide_charge(seq) for seq in sequences]
return pd.DataFrame({"sequence": sequences, "charge": charge})

Expand Down