Spaces:

MilesCranmer
/

PySR

Running

App Files Community

MilesCranmer committed on Jun 2, 2021

Commit

17f8bf1

1 Parent(s): f77e43f

Allow control over tournament selection parameters

Browse files

Files changed (3) hide show

Project.toml +1 -1
pysr/sr.py +16 -4
setup.py +1 -1

Project.toml CHANGED Viewed

@@ -2,5 +2,5 @@
 SymbolicRegression = "8254be44-1295-4e6a-a16d-46603ac705cb"
 [compat]
-SymbolicRegression = "0.6.0"
 julia = "1.5"

 SymbolicRegression = "8254be44-1295-4e6a-a16d-46603ac705cb"
 [compat]
+SymbolicRegression = "0.6.1"
 julia = "1.5"

pysr/sr.py CHANGED Viewed

@@ -123,7 +123,9 @@ def pysr(X, y, weights=None,
          optimizer_algorithm="BFGS",
          optimizer_nrestarts=3,
          optimize_probability=1.0,
-         optimizer_iterations=10
          ):
     """Run symbolic regression to fit f(X[i, :]) ~ y[i] for all i.
     Note: most default parameters have been tuned over several example
@@ -234,6 +236,10 @@ def pysr(X, y, weights=None,
     :type output_jax_format: bool
     :param output_torch_format: Whether to create a 'torch_format' column in the output, containing a torch module with trainable parameters.
     :type output_torch_format: bool
     :returns: Results dataframe, giving complexity, MSE, and equations (as strings), as well as functional forms. If list, each element corresponds to a dataframe of equations for each output.
     :type: pd.DataFrame/list
     """
@@ -259,12 +265,12 @@ def pysr(X, y, weights=None,
             progress = False
     assert optimizer_algorithm in ['NelderMead', 'BFGS']
     if isinstance(X, pd.DataFrame):
         variable_names = list(X.columns)
         X = np.array(X)
     if len(X.shape) == 1:
         X = X[:, None]
@@ -344,7 +350,9 @@ def pysr(X, y, weights=None,
                  output_jax_format=output_jax_format,
                  output_torch_format=output_torch_format,
                  selection=selection,
-                 multioutput=multioutput, nout=nout)
     kwargs = {**_set_paths(tempdir), **kwargs}
@@ -515,7 +523,9 @@ def _make_hyperparams_julia_str(X, alpha, annealing, batchSize, batching, binary
                                variable_names, warmupMaxsizeBy, weightAddNode,
                                ncyclesperiteration, fractionReplaced, topn, verbosity, progress, loss,
                                weightDeleteNode, weightDoNothing, weightInsertNode, weightMutateConstant,
-                               weightMutateOperator, weightRandomize, weightSimplify, weights, **kwargs):
     try:
         term_width = shutil.get_terminal_size().columns
     except:
@@ -586,6 +596,8 @@ mutationWeights=[
 warmupMaxsizeBy={warmupMaxsizeBy:f}f0,
 useFrequency={"true" if useFrequency else "false"},
 npop={npop:d},
 ncyclesperiteration={ncyclesperiteration:d},
 fractionReplaced={fractionReplaced:f}f0,
 topn={topn:d},

          optimizer_algorithm="BFGS",
          optimizer_nrestarts=3,
          optimize_probability=1.0,
+         optimizer_iterations=10,
+         tournament_selection_n=10,
+         tournament_selection_p=1.0
          ):
     """Run symbolic regression to fit f(X[i, :]) ~ y[i] for all i.
     Note: most default parameters have been tuned over several example
     :type output_jax_format: bool
     :param output_torch_format: Whether to create a 'torch_format' column in the output, containing a torch module with trainable parameters.
     :type output_torch_format: bool
+    :param tournament_selection_n: Number of expressions to consider in each tournament.
+    :type tournament_selection_n: int
+    :param tournament_selection_p: Probability of selecting the best expression in each tournament. The probability will decay as p*(1-p)^n for other expressions, sorted by loss.
+    :type tournament_selection_p: float
     :returns: Results dataframe, giving complexity, MSE, and equations (as strings), as well as functional forms. If list, each element corresponds to a dataframe of equations for each output.
     :type: pd.DataFrame/list
     """
             progress = False
     assert optimizer_algorithm in ['NelderMead', 'BFGS']
+    assert tournament_selection_n < npop
     if isinstance(X, pd.DataFrame):
         variable_names = list(X.columns)
         X = np.array(X)
     if len(X.shape) == 1:
         X = X[:, None]
                  output_jax_format=output_jax_format,
                  output_torch_format=output_torch_format,
                  selection=selection,
+                 multioutput=multioutput, nout=nout,
+                 tournament_selection_n=tournament_selection_n,
+                 tournament_selection_p=tournament_selection_p)
     kwargs = {**_set_paths(tempdir), **kwargs}
                                variable_names, warmupMaxsizeBy, weightAddNode,
                                ncyclesperiteration, fractionReplaced, topn, verbosity, progress, loss,
                                weightDeleteNode, weightDoNothing, weightInsertNode, weightMutateConstant,
+                               weightMutateOperator, weightRandomize, weightSimplify, weights,
+                               tournament_selection_n, tournament_selection_p,
+                               **kwargs):
     try:
         term_width = shutil.get_terminal_size().columns
     except:
 warmupMaxsizeBy={warmupMaxsizeBy:f}f0,
 useFrequency={"true" if useFrequency else "false"},
 npop={npop:d},
+ns={tournament_selection_n:d},
+probPickFirst={tournament_selection_p:f}f0,
 ncyclesperiteration={ncyclesperiteration:d},
 fractionReplaced={fractionReplaced:f}f0,
 topn={topn:d},

setup.py CHANGED Viewed

@@ -5,7 +5,7 @@ with open("README.md", "r") as fh:
 setuptools.setup(
     name="pysr",
-    version="0.6.0-1",
     author="Miles Cranmer",
     author_email="miles.cranmer@gmail.com",
     description="Simple and efficient symbolic regression",

 setuptools.setup(
     name="pysr",
+    version="0.6.1",
     author="Miles Cranmer",
     author_email="miles.cranmer@gmail.com",
     description="Simple and efficient symbolic regression",