Spaces:
Running
Running
Commit
·
15fbc5f
1
Parent(s):
c6b4cc5
Track frequency of complexities, and try to invert
Browse files- TODO.md +1 -1
- julia/sr.jl +18 -9
- pysr/sr.py +5 -0
TODO.md
CHANGED
|
@@ -57,6 +57,7 @@
|
|
| 57 |
- [x] Better cleanup of zombie processes after <ctrl-c>
|
| 58 |
- [x] Consider printing output sorted by score, not by complexity.
|
| 59 |
- [x] Increase max complexity slowly over time up to the actual max.
|
|
|
|
| 60 |
- [ ] Sort these todo lists by priority
|
| 61 |
|
| 62 |
## Feature ideas
|
|
@@ -78,7 +79,6 @@
|
|
| 78 |
|
| 79 |
## Algorithmic performance ideas:
|
| 80 |
|
| 81 |
-
- [ ] **Record density over complexity. Favor equations that have a density we have not explored yet. Want the final density to be evenly distributed.**
|
| 82 |
|
| 83 |
- [ ] Use package compiler and compile sr.jl into a standalone binary that can be used by pysr.
|
| 84 |
- [ ] When doing equation warmup, only migrate those equations with almost the same complexity. Rather than having to consider simple equations later in the game.
|
|
|
|
| 57 |
- [x] Better cleanup of zombie processes after <ctrl-c>
|
| 58 |
- [x] Consider printing output sorted by score, not by complexity.
|
| 59 |
- [x] Increase max complexity slowly over time up to the actual max.
|
| 60 |
+
- [x] Record density over complexity. Favor equations that have a density we have not explored yet. Want the final density to be evenly distributed.
|
| 61 |
- [ ] Sort these todo lists by priority
|
| 62 |
|
| 63 |
## Feature ideas
|
|
|
|
| 79 |
|
| 80 |
## Algorithmic performance ideas:
|
| 81 |
|
|
|
|
| 82 |
|
| 83 |
- [ ] Use package compiler and compile sr.jl into a standalone binary that can be used by pysr.
|
| 84 |
- [ ] When doing equation warmup, only migrate those equations with almost the same complexity. Rather than having to consider simple equations later in the game.
|
julia/sr.jl
CHANGED
|
@@ -691,7 +691,7 @@ end
|
|
| 691 |
|
| 692 |
# Go through one simulated annealing mutation cycle
|
| 693 |
# exp(-delta/T) defines probability of accepting a change
|
| 694 |
-
function iterate(member::PopMember, T::Float32, curmaxsize::Integer)::PopMember
|
| 695 |
prev = member.tree
|
| 696 |
tree = prev
|
| 697 |
#TODO - reconsider this
|
|
@@ -801,6 +801,11 @@ function iterate(member::PopMember, T::Float32, curmaxsize::Integer)::PopMember
|
|
| 801 |
if annealing
|
| 802 |
delta = afterLoss - beforeLoss
|
| 803 |
probChange = exp(-delta/(T*alpha))
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 804 |
|
| 805 |
return_unaltered = (isnan(afterLoss) || probChange < rand())
|
| 806 |
if return_unaltered
|
|
@@ -863,7 +868,8 @@ end
|
|
| 863 |
|
| 864 |
# Pass through the population several times, replacing the oldest
|
| 865 |
# with the fittest of a small subsample
|
| 866 |
-
function regEvolCycle(pop::Population, T::Float32, curmaxsize::Integer
|
|
|
|
| 867 |
# Batch over each subsample. Can give 15% improvement in speed; probably more so for large pops.
|
| 868 |
# but is ultimately a different algorithm than regularized evolution, and might not be
|
| 869 |
# as good.
|
|
@@ -884,7 +890,7 @@ function regEvolCycle(pop::Population, T::Float32, curmaxsize::Integer)::Populat
|
|
| 884 |
end
|
| 885 |
end
|
| 886 |
allstar = pop.members[best_idx]
|
| 887 |
-
babies[i] = iterate(allstar, T, curmaxsize)
|
| 888 |
end
|
| 889 |
|
| 890 |
# Replace the n_evol_cycles-oldest members of each population
|
|
@@ -895,7 +901,7 @@ function regEvolCycle(pop::Population, T::Float32, curmaxsize::Integer)::Populat
|
|
| 895 |
else
|
| 896 |
for i=1:round(Integer, pop.n/ns)
|
| 897 |
allstar = bestOfSample(pop)
|
| 898 |
-
baby = iterate(allstar, T, curmaxsize)
|
| 899 |
#printTree(baby.tree)
|
| 900 |
oldest = argmin([pop.members[member].birth for member=1:pop.n])
|
| 901 |
pop.members[oldest] = baby
|
|
@@ -910,16 +916,17 @@ end
|
|
| 910 |
function run(
|
| 911 |
pop::Population,
|
| 912 |
ncycles::Integer,
|
| 913 |
-
curmaxsize::Integer
|
|
|
|
| 914 |
verbosity::Integer=0
|
| 915 |
)::Population
|
| 916 |
|
| 917 |
allT = LinRange(1.0f0, 0.0f0, ncycles)
|
| 918 |
for iT in 1:size(allT)[1]
|
| 919 |
if annealing
|
| 920 |
-
pop = regEvolCycle(pop, allT[iT], curmaxsize)
|
| 921 |
else
|
| 922 |
-
pop = regEvolCycle(pop, 1.0f0, curmaxsize)
|
| 923 |
end
|
| 924 |
|
| 925 |
if verbosity > 0 && (iT % verbosity == 0)
|
|
@@ -1062,6 +1069,7 @@ function fullRun(niterations::Integer;
|
|
| 1062 |
channels = [RemoteChannel(1) for j=1:npopulations]
|
| 1063 |
bestSubPops = [Population(1) for j=1:npopulations]
|
| 1064 |
hallOfFame = HallOfFame()
|
|
|
|
| 1065 |
curmaxsize = 3
|
| 1066 |
if warmupMaxsize == 0
|
| 1067 |
curmaxsize = maxsize
|
|
@@ -1074,7 +1082,7 @@ function fullRun(niterations::Integer;
|
|
| 1074 |
|
| 1075 |
# # 2. Start the cycle on every process:
|
| 1076 |
@sync for i=1:npopulations
|
| 1077 |
-
@async allPops[i] = @spawnat :any run(fetch(allPops[i]), ncyclesperiteration, curmaxsize, verbosity=verbosity)
|
| 1078 |
end
|
| 1079 |
println("Started!")
|
| 1080 |
cycles_complete = npopulations * niterations
|
|
@@ -1103,6 +1111,7 @@ function fullRun(niterations::Integer;
|
|
| 1103 |
|
| 1104 |
for member in cur_pop.members
|
| 1105 |
size = countNodes(member.tree)
|
|
|
|
| 1106 |
if member.score < hallOfFame.members[size].score
|
| 1107 |
hallOfFame.members[size] = deepcopy(member)
|
| 1108 |
hallOfFame.exists[size] = true
|
|
@@ -1164,7 +1173,7 @@ function fullRun(niterations::Integer;
|
|
| 1164 |
|
| 1165 |
@async begin
|
| 1166 |
allPops[i] = @spawnat :any let
|
| 1167 |
-
tmp_pop = run(cur_pop, ncyclesperiteration, curmaxsize, verbosity=verbosity)
|
| 1168 |
@inbounds @simd for j=1:tmp_pop.n
|
| 1169 |
if rand() < 0.1
|
| 1170 |
tmp_pop.members[j].tree = simplifyTree(tmp_pop.members[j].tree)
|
|
|
|
| 691 |
|
| 692 |
# Go through one simulated annealing mutation cycle
|
| 693 |
# exp(-delta/T) defines probability of accepting a change
|
| 694 |
+
function iterate(member::PopMember, T::Float32, curmaxsize::Integer, frequencyComplexity::Array{Float32, 1})::PopMember
|
| 695 |
prev = member.tree
|
| 696 |
tree = prev
|
| 697 |
#TODO - reconsider this
|
|
|
|
| 801 |
if annealing
|
| 802 |
delta = afterLoss - beforeLoss
|
| 803 |
probChange = exp(-delta/(T*alpha))
|
| 804 |
+
if useFrequency
|
| 805 |
+
oldSize = countNodes(prev)
|
| 806 |
+
newSize = countNodes(tree)
|
| 807 |
+
probChange *= frequencyComplexity[oldSize] / frequencyComplexity[newSize]
|
| 808 |
+
end
|
| 809 |
|
| 810 |
return_unaltered = (isnan(afterLoss) || probChange < rand())
|
| 811 |
if return_unaltered
|
|
|
|
| 868 |
|
| 869 |
# Pass through the population several times, replacing the oldest
|
| 870 |
# with the fittest of a small subsample
|
| 871 |
+
function regEvolCycle(pop::Population, T::Float32, curmaxsize::Integer,
|
| 872 |
+
frequencyComplexity::Array{Float32, 1})::Population
|
| 873 |
# Batch over each subsample. Can give 15% improvement in speed; probably more so for large pops.
|
| 874 |
# but is ultimately a different algorithm than regularized evolution, and might not be
|
| 875 |
# as good.
|
|
|
|
| 890 |
end
|
| 891 |
end
|
| 892 |
allstar = pop.members[best_idx]
|
| 893 |
+
babies[i] = iterate(allstar, T, curmaxsize, frequencyComplexity)
|
| 894 |
end
|
| 895 |
|
| 896 |
# Replace the n_evol_cycles-oldest members of each population
|
|
|
|
| 901 |
else
|
| 902 |
for i=1:round(Integer, pop.n/ns)
|
| 903 |
allstar = bestOfSample(pop)
|
| 904 |
+
baby = iterate(allstar, T, curmaxsize, frequencyComplexity)
|
| 905 |
#printTree(baby.tree)
|
| 906 |
oldest = argmin([pop.members[member].birth for member=1:pop.n])
|
| 907 |
pop.members[oldest] = baby
|
|
|
|
| 916 |
function run(
|
| 917 |
pop::Population,
|
| 918 |
ncycles::Integer,
|
| 919 |
+
curmaxsize::Integer,
|
| 920 |
+
frequencyComplexity::Array{Float32, 1};
|
| 921 |
verbosity::Integer=0
|
| 922 |
)::Population
|
| 923 |
|
| 924 |
allT = LinRange(1.0f0, 0.0f0, ncycles)
|
| 925 |
for iT in 1:size(allT)[1]
|
| 926 |
if annealing
|
| 927 |
+
pop = regEvolCycle(pop, allT[iT], curmaxsize, frequencyComplexity)
|
| 928 |
else
|
| 929 |
+
pop = regEvolCycle(pop, 1.0f0, curmaxsize, frequencyComplexity)
|
| 930 |
end
|
| 931 |
|
| 932 |
if verbosity > 0 && (iT % verbosity == 0)
|
|
|
|
| 1069 |
channels = [RemoteChannel(1) for j=1:npopulations]
|
| 1070 |
bestSubPops = [Population(1) for j=1:npopulations]
|
| 1071 |
hallOfFame = HallOfFame()
|
| 1072 |
+
frequencyComplexity = ones(Float32, actualMaxsize)
|
| 1073 |
curmaxsize = 3
|
| 1074 |
if warmupMaxsize == 0
|
| 1075 |
curmaxsize = maxsize
|
|
|
|
| 1082 |
|
| 1083 |
# # 2. Start the cycle on every process:
|
| 1084 |
@sync for i=1:npopulations
|
| 1085 |
+
@async allPops[i] = @spawnat :any run(fetch(allPops[i]), ncyclesperiteration, curmaxsize, copy(frequencyComplexity)/sum(frequencyComplexity), verbosity=verbosity)
|
| 1086 |
end
|
| 1087 |
println("Started!")
|
| 1088 |
cycles_complete = npopulations * niterations
|
|
|
|
| 1111 |
|
| 1112 |
for member in cur_pop.members
|
| 1113 |
size = countNodes(member.tree)
|
| 1114 |
+
frequencyComplexity[size] += 1
|
| 1115 |
if member.score < hallOfFame.members[size].score
|
| 1116 |
hallOfFame.members[size] = deepcopy(member)
|
| 1117 |
hallOfFame.exists[size] = true
|
|
|
|
| 1173 |
|
| 1174 |
@async begin
|
| 1175 |
allPops[i] = @spawnat :any let
|
| 1176 |
+
tmp_pop = run(cur_pop, ncyclesperiteration, curmaxsize, copy(frequencyComplexity)/sum(frequencyComplexity), verbosity=verbosity)
|
| 1177 |
@inbounds @simd for j=1:tmp_pop.n
|
| 1178 |
if rand() < 0.1
|
| 1179 |
tmp_pop.members[j].tree = simplifyTree(tmp_pop.members[j].tree)
|
pysr/sr.py
CHANGED
|
@@ -90,6 +90,7 @@ def pysr(X=None, y=None, weights=None,
|
|
| 90 |
select_k_features=None,
|
| 91 |
warmupMaxsize=0,
|
| 92 |
constraints={},
|
|
|
|
| 93 |
limitPowComplexity=False, #deprecated
|
| 94 |
threads=None, #deprecated
|
| 95 |
julia_optimization=3,
|
|
@@ -172,6 +173,9 @@ def pysr(X=None, y=None, weights=None,
|
|
| 172 |
arguments of operators. E.g., `'pow': (-1, 1)`
|
| 173 |
says that power laws can have any complexity left argument, but only
|
| 174 |
1 complexity exponent. Use this to force more interpretable solutions.
|
|
|
|
|
|
|
|
|
|
| 175 |
:param julia_optimization: int, Optimization level (0, 1, 2, 3)
|
| 176 |
:returns: pd.DataFrame, Results dataframe, giving complexity, MSE, and equations
|
| 177 |
(as strings).
|
|
@@ -327,6 +331,7 @@ const mutationWeights = [
|
|
| 327 |
]
|
| 328 |
const warmupMaxsize = {warmupMaxsize:d}
|
| 329 |
const limitPowComplexity = {"true" if limitPowComplexity else "false"}
|
|
|
|
| 330 |
"""
|
| 331 |
|
| 332 |
op_runner = ""
|
|
|
|
| 90 |
select_k_features=None,
|
| 91 |
warmupMaxsize=0,
|
| 92 |
constraints={},
|
| 93 |
+
useFrequency=False,
|
| 94 |
limitPowComplexity=False, #deprecated
|
| 95 |
threads=None, #deprecated
|
| 96 |
julia_optimization=3,
|
|
|
|
| 173 |
arguments of operators. E.g., `'pow': (-1, 1)`
|
| 174 |
says that power laws can have any complexity left argument, but only
|
| 175 |
1 complexity exponent. Use this to force more interpretable solutions.
|
| 176 |
+
:param useFrequency: bool, whether to measure the frequency of complexities,
|
| 177 |
+
and use that instead of parsimony to explore equation space. Will
|
| 178 |
+
naturally find equations of all complexities.
|
| 179 |
:param julia_optimization: int, Optimization level (0, 1, 2, 3)
|
| 180 |
:returns: pd.DataFrame, Results dataframe, giving complexity, MSE, and equations
|
| 181 |
(as strings).
|
|
|
|
| 331 |
]
|
| 332 |
const warmupMaxsize = {warmupMaxsize:d}
|
| 333 |
const limitPowComplexity = {"true" if limitPowComplexity else "false"}
|
| 334 |
+
const useFrequency = {"true" if useFrequency else "false"}
|
| 335 |
"""
|
| 336 |
|
| 337 |
op_runner = ""
|