修复错误 python 数独使用遗传算法？

问题描述

""" Solves a Sudoku puzzle using a genetic algorithm. This is based on a piece of coursework produced 
by Christian Thomas Jacobs as part of the CS3M6 Evolutionary computation module at the University of 
Reading.
copyright (c) 2009,2017 Christian Thomas Jacobs
"""
from functools import cmp_to_key
import numpy
import random
random.seed()

Nd = 9  # Number of digits (in the case of standard Sudoku puzzles,this is 9).


class Population(object):
""" A set of candidate solutions to the Sudoku puzzle. These candidates are also kNown as the chromosomes in the population. """

def __init__(self):
    self.candidates = []
    return

def seed(self,Nc,given):
    self.candidates = []
    
    # Determine the legal values that each square can take.
    helper = Candidate()
    helper.values = [[[] for j in range(0,Nd)] for i in range(0,Nd)]
    for row in range(0,Nd):
        for column in range(0,Nd):
            for value in range(1,10):
                if((given.values[row][column] == 0) and not (given.is_column_duplicate(column,value) or given.is_block_duplicate(row,column,value) or given.is_row_duplicate(row,value))):
                    # Value is available.
                    helper.values[row][column].append(value)
                elif(given.values[row][column] != 0):
                    # Given/kNown value from file.
                    helper.values[row][column].append(given.values[row][column])
                    break

    # Seed a new population.       
    for p in range(0,Nc):
        g = Candidate()
        for i in range(0,Nd): # New row in candidate.
            row = numpy.zeros(Nd)
            
            # Fill in the givens.
            for j in range(0,Nd): # New column j value in row i.
            
                # If value is already given,don't change it.
                if(given.values[i][j] != 0):
                    row[j] = given.values[i][j]
                # Fill in the gaps using the helper board.
                elif(given.values[i][j] == 0):
                    row[j] = helper.values[i][j][random.randint(0,len(helper.values[i][j])-1)]

            # If we don't have a valid board,then try again. There must be no duplicates in the row.
            while(len(list(set(row))) != Nd):
                for j in range(0,Nd):
                    if(given.values[i][j] == 0):
                        row[j] = helper.values[i][j][random.randint(0,len(helper.values[i][j])-1)]

            g.values[i] = row

        self.candidates.append(g)
    
    # Compute the fitness of all candidates in the population.
    self.update_fitness()
    
    print("seeding complete.")
    
    return
    
def update_fitness(self):
    """ Update fitness of every candidate/chromosome. """
    for candidate in self.candidates:
        candidate.update_fitness()
    return
    
def sort(self):
    """ Sort the population based on fitness. """
    self.candidates.sort(key=cmp_to_key(self.sort_fitness))
    return

def sort_fitness(self,x,y):
    """ The sorting function. """
    if(x.fitness < y.fitness):
        return 1
    elif(x.fitness == y.fitness):
        return 0
    else:
        return -1


class Candidate(object):
""" A candidate solutions to the Sudoku puzzle. """
def __init__(self):
    self.values = numpy.zeros((Nd,Nd),dtype=int)
    self.fitness = None
    return

def update_fitness(self):
    """ The fitness of a candidate solution is determined by how close it is to being the actual solution to the puzzle. The actual solution (i.e. the 'fittest') is defined as a 9x9 grid of numbers in the range [1,9] where each row,column and 3x3 block contains the numbers [1,9] without any duplicates (see e.g. http://www.sudoku.com/); if there are any duplicates then the fitness will be lower. """
    
    row_count = numpy.zeros(Nd)
    column_count = numpy.zeros(Nd)
    block_count = numpy.zeros(Nd)
    row_sum = 0
    column_sum = 0
    block_sum = 0

    for i in range(0,Nd):  # For each row...
        for j in range(0,Nd):  # For each number within it...
            row_count[self.values[i][j]-1] += 1  # ...Update list with occurrence of a particular number.

        row_sum += (1.0/len(set(row_count)))/Nd
        row_count = numpy.zeros(Nd)

    for i in range(0,Nd):  # For each column...
        for j in range(0,Nd):  # For each number within it...
            column_count[self.values[j][i]-1] += 1  # ...Update list with occurrence of a particular number.

        column_sum += (1.0 / len(set(column_count)))/Nd
        column_count = numpy.zeros(Nd)


    # For each block...
    for i in range(0,Nd,3):
        for j in range(0,3):
            block_count[self.values[i][j]-1] += 1
            block_count[self.values[i][j+1]-1] += 1
            block_count[self.values[i][j+2]-1] += 1
            
            block_count[self.values[i+1][j]-1] += 1
            block_count[self.values[i+1][j+1]-1] += 1
            block_count[self.values[i+1][j+2]-1] += 1
            
            block_count[self.values[i+2][j]-1] += 1
            block_count[self.values[i+2][j+1]-1] += 1
            block_count[self.values[i+2][j+2]-1] += 1

            block_sum += (1.0/len(set(block_count)))/Nd
            block_count = numpy.zeros(Nd)

    # Calculate overall fitness.
    if (int(row_sum) == 1 and int(column_sum) == 1 and int(block_sum) == 1):
        fitness = 1.0
    else:
        fitness = column_sum * block_sum
    
    self.fitness = fitness
    return
    
def mutate(self,mutation_rate,given):
    """ Mutate a candidate by picking a row,and then picking two values within that row to swap. """

    r = random.uniform(0,1.1)
    while(r > 1): # Outside [0,1] boundary - choose another
        r = random.uniform(0,1.1)

    success = False
    if (r < mutation_rate):  # Mutate.
        while(not success):
            row1 = random.randint(0,8)
            row2 = random.randint(0,8)
            row2 = row1
            
            from_column = random.randint(0,8)
            to_column = random.randint(0,8)
            while(from_column == to_column):
                from_column = random.randint(0,8)
                to_column = random.randint(0,8)   

            # Check if the two places are free...
            if(given.values[row1][from_column] == 0 and given.values[row1][to_column] == 0):
                # ...and that we are not causing a duplicate in the rows' columns.
                if(not given.is_column_duplicate(to_column,self.values[row1][from_column])
                   and not given.is_column_duplicate(from_column,self.values[row2][to_column])
                   and not given.is_block_duplicate(row2,to_column,self.values[row1][from_column])
                   and not given.is_block_duplicate(row1,from_column,self.values[row2][to_column])):
                
                    # Swap values.
                    temp = self.values[row2][to_column]
                    self.values[row2][to_column] = self.values[row1][from_column]
                    self.values[row1][from_column] = temp
                    success = True

    return success


class Given(Candidate):
""" The grid containing the given/kNown values. """

def __init__(self,values):
    self.values = values
    return
    
def is_row_duplicate(self,row,value):
    """ Check whether there is a duplicate of a fixed/given value in a row. """
    for column in range(0,Nd):
        if(self.values[row][column] == value):
           return True
    return False

def is_column_duplicate(self,value):
    """ Check whether there is a duplicate of a fixed/given value in a column. """
    for row in range(0,Nd):
        if(self.values[row][column] == value):
           return True
    return False

def is_block_duplicate(self,value):
    """ Check whether there is a duplicate of a fixed/given value in a 3 x 3 block. """
    i = 3*(int(row/3))
    j = 3*(int(column/3))

    if((self.values[i][j] == value)
       or (self.values[i][j+1] == value)
       or (self.values[i][j+2] == value)
       or (self.values[i+1][j] == value)
       or (self.values[i+1][j+1] == value)
       or (self.values[i+1][j+2] == value)
       or (self.values[i+2][j] == value)
       or (self.values[i+2][j+1] == value)
       or (self.values[i+2][j+2] == value)):
        return True
    else:
        return False


class Tournament(object):
""" The crossover function requires two parents to be selected from the population pool. The Tournament class is used to do this.

Two individuals are selected from the population pool and a random number in [0,1] is chosen. If this number is less than the 'selection rate' (e.g. 0.85),then the fitter individual is selected; otherwise,the weaker one is selected.
"""

def __init__(self):
    return
    
def compete(self,candidates):
    """ Pick 2 random candidates from the population and get them to compete against each other. """
    c1 = candidates[random.randint(0,len(candidates)-1)]
    c2 = candidates[random.randint(0,len(candidates)-1)]
    f1 = c1.fitness
    f2 = c2.fitness

    # Find the fittest and the weakest.
    if(f1 > f2):
        fittest = c1
        weakest = c2
    else:
        fittest = c2
        weakest = c1

    selection_rate = 0.85
    r = random.uniform(0,1.1)
    while(r > 1):  # Outside [0,1] boundary. Choose another.
        r = random.uniform(0,1.1)
    if(r < selection_rate):
        return fittest
    else:
        return weakest

class CycleCrossover(object):
""" Crossover relates to the analogy of genes within each parent candidate mixing together in the hopes of creating a fitter child candidate. Cycle crossover is used here (see e.g. A. E. Eiben,J. E. Smith. Introduction to Evolutionary Computing. Springer,2007). """

def __init__(self):
    return

def crossover(self,parent1,parent2,crossover_rate):
    """ Create two new child candidates by crossing over parent genes. """
    child1 = Candidate()
    child2 = Candidate()
    
    # Make a copy of the parent genes.
    child1.values = numpy.copy(parent1.values)
    child2.values = numpy.copy(parent2.values)

    r = random.uniform(0,1.1)
        
    # Perform crossover.
    if (r < crossover_rate):
        # Pick a crossover point. Crossover must have at least 1 row (and at most Nd-1) rows.
        crossover_point1 = random.randint(0,8)
        crossover_point2 = random.randint(1,9)
        while(crossover_point1 == crossover_point2):
            crossover_point1 = random.randint(0,8)
            crossover_point2 = random.randint(1,9)
            
        if(crossover_point1 > crossover_point2):
            temp = crossover_point1
            crossover_point1 = crossover_point2
            crossover_point2 = temp
            
        for i in range(crossover_point1,crossover_point2):
            child1.values[i],child2.values[i] = self.crossover_rows(child1.values[i],child2.values[i])

    return child1,child2

def crossover_rows(self,row1,row2): 
    child_row1 = numpy.zeros(Nd)
    child_row2 = numpy.zeros(Nd)

    remaining = list(range(1,Nd+1))
    cycle = 0
    
    while((0 in child_row1) and (0 in child_row2)):  # While child rows not complete...
        if(cycle % 2 == 0):  # Even cycles.
            # Assign next unused value.
            index = self.find_unused(row1,remaining)
            start = row1[index]
            remaining.remove(row1[index])
            child_row1[index] = row1[index]
            child_row2[index] = row2[index]
            next = row2[index]
            
            while(next != start):  # While cycle not done...
                index = self.find_value(row1,next)
                child_row1[index] = row1[index]
                remaining.remove(row1[index])
                child_row2[index] = row2[index]
                next = row2[index]

            cycle += 1

        else:  # Odd cycle - flip values.
            index = self.find_unused(row1,remaining)
            start = row1[index]
            remaining.remove(row1[index])
            child_row1[index] = row2[index]
            child_row2[index] = row1[index]
            next = row2[index]
            
            while(next != start):  # While cycle not done...
                index = self.find_value(row1,next)
                child_row1[index] = row2[index]
                remaining.remove(row1[index])
                child_row2[index] = row1[index]
                next = row2[index]
                
            cycle += 1
        
    return child_row1,child_row2  
       
def find_unused(self,parent_row,remaining):
    for i in range(0,len(parent_row)):
        if(parent_row[i] in remaining):
            return i

def find_value(self,value):
    for i in range(0,len(parent_row)):
        if(parent_row[i] == value):
            return i


class Sudoku(object):
""" Solves a given Sudoku puzzle using a genetic algorithm. """

def __init__(self):
    self.given = None
    return

def load(self,path):
    # Load a configuration to solve.
    with open(path,"r") as f:
        values = numpy.loadtxt(f).reshape((Nd,Nd)).astype(int)
        self.given = Given(values)
    return

def save(self,path,solution):
    # Save a configuration to a file.
    with open(path,"w") as f:
        numpy.savetxt(f,solution.values.reshape(Nd*Nd),fmt='%d')
    return
    
def solve(self):
    Nc = 1000  # Number of candidates (i.e. population size).
    Ne = int(0.05*Nc)  # Number of elites.
    Ng = 1000  # Number of generations.
    Nm = 0  # Number of mutations.
    
    # Mutation parameters.
    phi = 0
    sigma = 1
    mutation_rate = 0.06

    # Create an initial population.
    self.population = Population()
    self.population.seed(Nc,self.given)

    # For up to 10000 generations...
    stale = 0
    for generation in range(0,Ng):
    
        print("Generation %d" % generation)
        
        # Check for a solution.
        best_fitness = 0.0
        for c in range(0,Nc):
            fitness = self.population.candidates[c].fitness
            if(fitness == 1):
                print("Solution found at generation %d!" % generation)
                print(self.population.candidates[c].values)
                return self.population.candidates[c]

            # Find the best fitness.
            if(fitness > best_fitness):
                best_fitness = fitness

        print("Best fitness: %f" % best_fitness)

        # Create the next population.
        next_population = []

        # Select elites (the fittest candidates) and preserve them for the next generation.
        self.population.sort()
        elites = []
        for e in range(0,Ne):
            elite = Candidate()
            elite.values = numpy.copy(self.population.candidates[e].values)
            elites.append(elite)

        # Create the rest of the candidates.
        for count in range(Ne,2):
            # Select parents from population via a tournament.
            t = Tournament()
            parent1 = t.compete(self.population.candidates)
            parent2 = t.compete(self.population.candidates)
            
            ## Cross-over.
            cc = CycleCrossover()
            child1,child2 = cc.crossover(parent1,crossover_rate=1.0)
            
            # # Mutate child1.
            # old_fitness = child1.fitness
            # success = child1.mutate(mutation_rate,self.given)
            # child1.update_fitness()
            # if(success):
            #     Nm += 1
            #     if(child1.fitness > float(old_fitness)):  # Used to calculate the relative success rate of mutations.
            #         phi = phi + 1
            
            # Mutate child2.
            old_fitness = child2.fitness
            success = child2.mutate(mutation_rate,self.given)
            child2.update_fitness()
            if(success):
                Nm += 1
                if(child2.fitness > old_fitness):  # Used to calculate the relative success rate of mutations.
                    phi = phi + 1
            
            # Add children to new population.
            next_population.append(child1)
            next_population.append(child2)

        # Append elites onto the end of the population. These will not have been affected by crossover or mutation.
        for e in range(0,Ne):
            next_population.append(elites[e])
            
        # Select next generation.
        self.population.candidates = next_population
        self.population.update_fitness()
        
        # Calculate new adaptive mutation rate (based on Rechenberg's 1/5 success rule). This is to stop too much mutation as the fitness progresses towards unity.
        if(Nm == 0):
            phi = 0  # Avoid divide by zero.
        else:
            phi = phi / Nm
        
        if(phi > 0.2):
            sigma = sigma/0.998
        elif(phi < 0.2):
            sigma = sigma*0.998

        mutation_rate = abs(numpy.random.normal(loc=0.0,scale=sigma,size=None))
        Nm = 0
        phi = 0

        # Check for stale population.
        self.population.sort()
        if(self.population.candidates[0].fitness != self.population.candidates[1].fitness):
            stale = 0
        else:
            stale += 1

        # Re-seed the population if 100 generations have passed with the fittest two candidates always having the same fitness.
        if(stale >= 100):
            print("The population has gone stale. Re-seeding...")
            self.population.seed(Nc,self.given)
            stale = 0
            sigma = 1
            phi = 0
            Nm = 0
            mutation_rate = 0.06
    
    print("No solution found.")
    return None
    
s = Sudoku()
s.load("puzzle_mild.txt")
solution = s.solve()
if(solution):
s.save("solution.txt",solution)

我尝试运行用于解决遗传算法数独问题的代码，但错误是这样的。我认为代码是用python2编写的，我正在尝试将其转换回python3以便我可以运行它

我也不明白为什么程序中有一种“nonetype”类型，有没有办法将其转换为“Float”类型进行比较。

文件拼图_mild.txt

0 3 0 0 7 0 0 5 0 5 0 0 1 0 6 0 0 9 0 0 1 0 0 0 4 0 0 0 9 0 0 5 0 0 6 0 6 0 0 4 0 2 0 0 7 0 4 0 0 1 0 0 3 0 0 0 2 0 0 0 8 0 0 9 0 0 3 0 5 0 0 2 0 1 0 0 2 0 0 7 0

解决方法

我不明白您的代码，而且似乎还有缩进拼写错误。

但是，Candidate 作为一个类将您的适应度值初始化为 None，对于 child1 和 child2 在 crossover 方法中。在 crossover 和 child1 返回并在您的代码中使用之前，它们永远不会在 child2 方法中被覆盖。转换为 Float 可能不是您想要的，因为您可能需要弄清楚为什么您的代码不正确，为什么它首先没有设置 fitness。

我建议为您的各个方法添加测试，以确保它们都按您的预期工作，然后再尝试让所有方法立即协同工作。

artificial-intelligence genetic-algorithm sudoku