From 7e4f3067ac33a3c668517f6549e1433d8ebf9b9f Mon Sep 17 00:00:00 2001 From: Manuel Lera-Ramirez Date: Wed, 31 Jul 2024 12:22:10 +0100 Subject: [PATCH] fix design and add tests --- src/pydna/design.py | 50 ++++++++++++++++++++++++++----------- tests/test_module_design.py | 37 +++++++++++++++++++++++++++ 2 files changed, 72 insertions(+), 15 deletions(-) diff --git a/src/pydna/design.py b/src/pydna/design.py index 3f6bd463..be7a5904 100755 --- a/src/pydna/design.py +++ b/src/pydna/design.py @@ -30,34 +30,44 @@ _module_logger = _logging.getLogger("pydna." + __name__) -def get_tm_and_primer(target_tm, template, limit, tm_func, starting_temp=0) -> Tuple[float, str]: +def _design_primer( + target_tm: float, template: _Dseqrecord, limit: int, tm_func, starting_length: int = 0 +) -> Tuple[float, str]: """returns a tuple (temp, primer)""" - tmp = starting_temp - length = limit + + if starting_length < limit: + starting_length = limit + + length = starting_length tlen = len(template) + + tmp = tm_func(str(template.seq[:length])) + p = str(template.seq[:length]) - if starting_temp < target_tm: + if tmp < target_tm: condition = _operator.le increment = 1 else: condition = _operator.ge increment = -1 while condition(tmp, target_tm): + prev_temp = tmp + prev_primer = p length += increment p = str(template.seq[:length]) tmp = tm_func(p) - if length >= tlen or length == 0: + if length >= tlen: break - ps = p[:-1] - tmps = tm_func(str(ps)) - _module_logger.debug(((p, tmp), (ps, tmps))) - return min((abs(target_tm - tmp), p), (abs(target_tm - tmps), ps)) + # Never go below the limit + if length < limit: + return template.seq[:limit] - -def get_tm_and_primer_with_estimate(target_tm, template, limit, tm_func, estimate_function): - first_temp, first_guess = get_tm_and_primer(target_tm, template, limit, estimate_function) - return get_tm_and_primer(target_tm, template, len(first_guess), tm_func, first_temp) + _module_logger.debug(((p, tmp), (prev_primer, prev_temp))) + if abs(target_tm - tmp) < abs(target_tm - prev_temp): + return p + else: + return prev_primer def primer_design( @@ -71,12 +81,21 @@ def primer_design( The optional fp and rp arguments can contain an existing primer for the sequence (either the forward or reverse primer). One or the other primers can be specified, not both (since then there is nothing to design!, use the pydna.amplify.pcr function instead). + The limit argument is the minimum length of the primer. The default value is 13. + If one of the primers is given, the other primer is designed to match in terms of Tm. If both primers are designed, they will be designed to target_tm tm_func is a function that takes an ascii string representing an oligonuceotide as argument and returns a float. Some useful functions can be found in the :mod:`pydna.tm` module, but can be substituted for a custom made function. + estimate_function is a tm_func-like function that is used to get a first guess for the primer design, that is then used as starting + point for the final result. This is useful when the tm_func function is slow to calculate (e.g. it relies on an + external API, such as the NEB primer design API). The estimate_function should be faster than the tm_func function. + The default value is `None`. + To use the default `tm_func` as estimate function to get the NEB Tm faster, you can do: + `primer_design(dseqr, target_tm=55, tm_func=tm_neb, estimate_function=tm_default)`. + The function returns a pydna.amplicon.Amplicon class instance. This object has the object.forward_primer and object.reverse_primer properties which contain the designed primers. @@ -153,9 +172,10 @@ def primer_design( def design(target_tm, template): if estimate_function: - return get_tm_and_primer_with_estimate(target_tm, template, limit, tm_func, estimate_function)[1] + first_guess = _design_primer(target_tm, template, limit, estimate_function) + return _design_primer(target_tm, template, limit, tm_func, len(first_guess)) else: - return get_tm_and_primer(target_tm, template, limit, tm_func)[1] + return _design_primer(target_tm, template, limit, tm_func) if not fp and not rp: _module_logger.debug("no primer given, design forward primer:") diff --git a/tests/test_module_design.py b/tests/test_module_design.py index 28e7039b..8c2fefc6 100755 --- a/tests/test_module_design.py +++ b/tests/test_module_design.py @@ -309,5 +309,42 @@ def test_too_short_template(): assert primer_design(fragment) == Amplicon("") +def test_get_tm_and_primer_from_above_and_below(): + """Starting from higher and lower lengths gives the same value""" + from pydna.design import _design_primer + from pydna.tm import tm_default + + for f in frags: + for temp in [40, 45, 50, 55]: + assert _design_primer(temp, f, 13, tm_default) == _design_primer(temp, f, 13, tm_default, 40) + + +def test_use_estimate_function(): + from pydna.design import primer_design + from pydna.tm import tm_default + + def tm_alt_lower(*args): + return tm_default(*args) - 10 + + def tm_alt_upper(*args): + return tm_default(*args) + 10 + + for f in frags: + for temp in [40, 45, 50, 55]: + amp_lower_with_estimate = primer_design( + f, target_tm=temp, tm_func=tm_alt_lower, estimate_function=tm_default + ) + amp_lower_no_estimate = primer_design(f, target_tm=temp, tm_func=tm_alt_lower) + + assert amp_lower_with_estimate == amp_lower_no_estimate + + amp_upper_with_estimate = primer_design( + f, target_tm=temp, tm_func=tm_alt_upper, estimate_function=tm_default + ) + amp_upper_no_estimate = primer_design(f, target_tm=temp, tm_func=tm_alt_upper) + + assert amp_upper_with_estimate == amp_upper_no_estimate + + if __name__ == "__main__": pytest.cmdline.main([__file__, "-v", "-s"])