Spaces:

MilesCranmer
/

PySR

Sleeping

App Files Community

MilesCranmer committed on Feb 26, 2021

Commit

67558da

1 Parent(s): 0a3b812

Warm up to a fraction of total training time

Browse files

Files changed (3) hide show

Project.toml +1 -1
pysr/sr.py +10 -8
setup.py +1 -1

Project.toml CHANGED Viewed

@@ -2,5 +2,5 @@
 SymbolicRegression = "8254be44-1295-4e6a-a16d-46603ac705cb"
 [compat]
-SymbolicRegression = "0.5.9"
 julia = "1.5"

 SymbolicRegression = "8254be44-1295-4e6a-a16d-46603ac705cb"
 [compat]
+SymbolicRegression = "0.5.10"
 julia = "1.5"

pysr/sr.py CHANGED Viewed

@@ -97,7 +97,7 @@ def pysr(X=None, y=None, weights=None,
             batching=False,
             batchSize=50,
             select_k_features=None,
-            warmupMaxsize=0,
             constraints={},
             useFrequency=False,
             tempdir=None,
@@ -106,7 +106,8 @@ def pysr(X=None, y=None, weights=None,
             julia_project=None,
             user_input=True,
             update=True,
-            temp_equation_file=False
         ):
     """Run symbolic regression to fit f(X[i, :]) ~ y[i] for all i.
     Note: most default parameters have been tuned over several example
@@ -191,10 +192,10 @@ def pysr(X=None, y=None, weights=None,
         Python using random forests, before passing to the symbolic regression
         code. None means no feature selection; an int means select that many
         features.
-    :param warmupMaxsize: int, whether to slowly increase max size from
         a small number up to the maxsize (if greater than 0).
-        If greater than 0, says how many cycles before the maxsize
-        is increased.
     :param constraints: dict of int (unary) or 2-tuples (binary),
         this enforces maxsize constraints on the individual
         arguments of operators. E.g., `'pow': (-1, 1)`
@@ -220,6 +221,7 @@ def pysr(X=None, y=None, weights=None,
         (as strings).
     """
     if isinstance(X, pd.DataFrame):
         variable_names = list(X.columns)
         X = np.array(X)
@@ -269,7 +271,7 @@ def pysr(X=None, y=None, weights=None,
                  shouldOptimizeConstants=shouldOptimizeConstants,
                  unary_operators=unary_operators, useFrequency=useFrequency,
                  use_custom_variable_names=use_custom_variable_names,
-                 variable_names=variable_names, warmupMaxsize=warmupMaxsize,
                  weightAddNode=weightAddNode,
                  weightDeleteNode=weightDeleteNode,
                  weightDoNothing=weightDoNothing,
@@ -418,7 +420,7 @@ def _make_hyperparams_julia_str(X, alpha, annealing, batchSize, batching, binary
                                maxdepth, maxsize, migration, nrestarts, npop,
                                parsimony, perturbationFactor, populations, procs, shouldOptimizeConstants,
                                unary_operators, useFrequency, use_custom_variable_names,
-                               variable_names, warmupMaxsize, weightAddNode,
                                ncyclesperiteration, fractionReplaced, topn, verbosity, progress, loss,
                                weightDeleteNode, weightDoNothing, weightInsertNode, weightMutateConstant,
                                weightMutateOperator, weightRandomize, weightSimplify, weights, **kwargs):
@@ -483,7 +485,7 @@ mutationWeights=[
     {weightRandomize:f},
     {weightDoNothing:f}
 ],
-warmupMaxsize={warmupMaxsize:d},
 useFrequency={"true" if useFrequency else "false"},
 npop={npop:d},
 ncyclesperiteration={ncyclesperiteration:d},

             batching=False,
             batchSize=50,
             select_k_features=None,
+            warmupMaxsizeBy=0.0,
             constraints={},
             useFrequency=False,
             tempdir=None,
             julia_project=None,
             user_input=True,
             update=True,
+            temp_equation_file=False,
+            warmupMaxsize=None, #Deprecated
         ):
     """Run symbolic regression to fit f(X[i, :]) ~ y[i] for all i.
     Note: most default parameters have been tuned over several example
         Python using random forests, before passing to the symbolic regression
         code. None means no feature selection; an int means select that many
         features.
+    :param warmupMaxsizeBy: float, whether to slowly increase max size from
         a small number up to the maxsize (if greater than 0).
+        If greater than 0, says the fraction of training time at which
+        the current maxsize will reach the user-passed maxsize.
     :param constraints: dict of int (unary) or 2-tuples (binary),
         this enforces maxsize constraints on the individual
         arguments of operators. E.g., `'pow': (-1, 1)`
         (as strings).
     """
+    assert warmupMaxsize == None, "warmupMaxsize is deprecated. Use warmupMaxsizeBy and give a fraction of time."
     if isinstance(X, pd.DataFrame):
         variable_names = list(X.columns)
         X = np.array(X)
                  shouldOptimizeConstants=shouldOptimizeConstants,
                  unary_operators=unary_operators, useFrequency=useFrequency,
                  use_custom_variable_names=use_custom_variable_names,
+                 variable_names=variable_names, warmupMaxsizeBy=warmupMaxsizeBy,
                  weightAddNode=weightAddNode,
                  weightDeleteNode=weightDeleteNode,
                  weightDoNothing=weightDoNothing,
                                maxdepth, maxsize, migration, nrestarts, npop,
                                parsimony, perturbationFactor, populations, procs, shouldOptimizeConstants,
                                unary_operators, useFrequency, use_custom_variable_names,
+                               variable_names, warmupMaxsizeBy, weightAddNode,
                                ncyclesperiteration, fractionReplaced, topn, verbosity, progress, loss,
                                weightDeleteNode, weightDoNothing, weightInsertNode, weightMutateConstant,
                                weightMutateOperator, weightRandomize, weightSimplify, weights, **kwargs):
     {weightRandomize:f},
     {weightDoNothing:f}
 ],
+warmupMaxsizeBy={warmupMaxsizeBy:f}f0,
 useFrequency={"true" if useFrequency else "false"},
 npop={npop:d},
 ncyclesperiteration={ncyclesperiteration:d},

setup.py CHANGED Viewed

@@ -5,7 +5,7 @@ with open("README.md", "r") as fh:
 setuptools.setup(
     name="pysr", # Replace with your own username
-    version="0.5.9",
     author="Miles Cranmer",
     author_email="[email protected]",
     description="Simple and efficient symbolic regression",

 setuptools.setup(
     name="pysr", # Replace with your own username
+    version="0.5.10",
     author="Miles Cranmer",
     author_email="[email protected]",
     description="Simple and efficient symbolic regression",