LCS-Income/lcs.py~ at master · James-Patrick/LCS-Income

341 lines (250 loc) · 9.25 KB
# -*- coding: utf-8 -*-
#import ea.py
import random_rules
import time, sys, getopt, ast
''' Notes '''
# After a while, we need to choose a number where the classifier is sufficiently experienced enough to be deleted if it's fitness is too low
''' (Not used)
HEADINGS_DICT = {'age': 'continuous', 
			'workclass': 'discrete',
			'fnlwgt': 'continuous',
			'education':'discrete',
			'education-num': 'continuous',
			'marital-status': 'discrete',
			'occupation':'discrete',
			'relationship':'discrete',
			'race':'discrete',
			'sex':'discrete',
			'capital-gain':'continuous',
			'capital-loss':'continuous',
			'hours-per-week':'continuous',
			'native-country':'discrete',
			'salary':'class-label'}
FILENAME = 'adult.data'
HEADINGS = ['age', 'workclass', 'fnlwgt', 'education', 'education-num',	'marital-status', 'occupation', 'relationship', 'race',	'sex', 'capital-gain', 'capital-loss',	'hours-per-week', 'native-country', 'salary']
CLASS_LABELS = ['<=50K', '>50K']
NUM_CLASSIFIERS = 500
LEARN_MODE    = 0
CLASSIFY_MODE = 1
CLASSIFIERS_FILE = "classifiers"
verbose = False
def make_verbose():
	global verbose
	verbose = True
# A classifier. 
# Contains a condition, an action, a fitness value
class Classifier:
	__all__ = set()
	def __init__(self, condition = None, action = None, duplicate = True, from_dict = False):
		if from_dict:
			self.read_from_dictionary(from_dict)
		  if condition:
			  self.condition = condition
			  self.condition = random_rules.generate_condition()
		  if action:
			  self.action = action
			  self.action = random_rules.generate_action(CLASS_LABELS)
		  self.prediction 	= 0.0
		  self.fitness 		= 0.0
		  self.error			= 0.0
		  self.experience 	= 0
		  self.times_correct 	= 0
		  self.times_wrong 	= 0
		  self.accuracy		= 0.0
		# Duplicate this classifier, creating the same classifier but for the inverse rule
		if duplicate:
			def flipped_action(action):
				if action == '<=50K':
					return '>50K'
					return '<=50K'
			dc = Classifier(self.condition, flipped_action(self.action), False)
		self.__class__.__all__.add(self)
		#self.test = random_rules.generate_condition()
	# Checks if condition is met in environment
	def check_condition(self, environment):
		for k, v in self.condition.items():
			if environment.dictionary[k] != v:
				return False			# One condition of this classifier was not met				
		return True	
	# Learns from the environment. Checks whether the rule held by the classifier is correct or not, depending on whether its conditions are met in the environment
	def learn(self, environment):
		# Updates the classifier's parameters based on whether it was correct or incorrect.
		def update_classifier(was_correct):
			self.experience += 1
			if was_correct:
				self.times_correct += 1 
				self.accuracy = self.times_correct * 1.0 / self.experience * 1.0
				self.times_wrong += 1
			#self.accuracy =
		# If this classifier has met all its conditions on the environment, add +1 experience points and return the classifier's action
		# (which in this case is either <= 50K or > 50K)
		if self.check_condition(environment):
			was_correct = (self.action == environment.correct_class)	
			update_classifier(was_correct)
			#self.print_details()
#			return self.action
#			return None
	def classify(self, environment):
		if self.check_condition(environment):
			return (self.accuracy, self.action)
	# Prints the details of the classifier in a nice, easy-to-read manner.
	def print_details(self):
		if verbose:
		#	print("{0:<15s} : {1}".format("Classifier #", self.id))
			print("{0:<15s} : {1}".format("Condition:", self.condition))
			print("{0:<15s} : {1}".format("Action:", self.action))
		#	print("{0:<15s} : {1}".format("Prediction:", self.prediction))
			print("{0:<15s} : {1}".format("Fitness:", self.fitness))
			print("{0:<15s} : {1}".format("Experience:", self.experience))
			print("{0:<15s} : {1}".format("Times Correct:", self.times_correct))
			print("{0:<15s} : {1}".format("Times Wrong:", self.times_wrong))
			print("{0:<15s1} : {1}".format("Accuracy:", self.accuracy * 100))
		#	print("{0:<15s} : {1}".format("Error:", self.error))		
	# Outputs the classifier's info as a dictionary
	def to_dictionary(self):
		to_dict = {}
	#	to_dict["id"] = self.id
		to_dict["condition"] = self.condition
		to_dict["action"] = self.action
		to_dict["accuracy"] = self.accuracy
		to_dict["experience"] = self.experience	  
		return to_dict
	# Inputs the classifiers info from a dictionary
	def read_from_dictionary(self, from_dict):
	#	self.id = from_dict["id"]
		self.condition = from_dict["condition"]
		self.action = from_dict["action"]
		self.accuracy = from_dict["accuracy"]
		self.experience	= from_dict["experience"]
# One environment (a dictionary that maps field names to their values).	
# For example, 
#   {'education': 'HS-grad', 'workclass': 'Local-gov', 'age': 67 ...}
# self.correct_class = The correct class label for this particular environment.
class Environment:
	def __init__(self, data):
		self.dictionary = {}
		for h in range(len(HEADINGS) - 1):
			# Convert field to integer if it is numeric, otherwise keep it as a string (so it may handle discrete/continuous variables).
			self.dictionary[HEADINGS[h]] = int(data[h]) if unicode(data[h]).isnumeric() else data[h]
		self.correct_class = data[len(HEADINGS) - 1]
	# Prints the details of the environment in a nice, easy-to-read manner.
	def print_details(self):
		if verbose:			#match_set  = []
			#action_set = []
			for k, v in self.dictionary.items():
				print("{0:<20s} : {1}".format(k, v))
			print("----------------------------")
			print("{0:<20s} : {1}".format("Correct class", self.correct_class))
def main(argv):
	def print_usage():
		print('--------------------------')
		print('lcs.py usage')
		print('--------------------------')
		print('Options:')
		print('-v verbose (print output)')
		print('-l Learn mode (default)')
		print('-c Classify mode')
	mode = LEARN_MODE
		opts, args = getopt.getopt(argv, "hvlc")
	except getopt.GetoptError:			#match_set  = []
			#action_set = []
		print_usage()
		sys.exit(2)
	for opt, arg in opts:
		if opt == '-h':
			print_usage()
			sys.exit()
		elif opt == '-v':
			make_verbose()
		elif opt == '-l':
			mode = LEARN_MODE
		elif opt == '-c':
			mode = CLASSIFY_MODE
	# Creates a list of environments.
	# Environments are stored as objects, which contain a dictionary, and a correct_class.
	def create_environments():	
		with open(FILENAME, "r") as file:		
			data = [f.replace(' ', '').rstrip().split(',') for f in file.readlines()]
		return [Environment(d) for d in data]
	environments = create_environments()
	def do_learn_mode():
		# Creates the initial population of classifiers, in the form of a list.
		def create_classifiers():
			for x in range(NUM_CLASSIFIERS):
			  Classifier()
			return Classifier.__all__
		# Writes all classifiers to a file, in dictionary format
		def write_classifiers(classifiers, output_file):
			for c in classifiers:
				output_file.write(str(c.to_dictionary()))
				output_file.write('\n')
		# One timestep. 
		def step(environment, classifiers):
			for c in classifiers:
				c.learn(environment)
		time_start = time.time()
		classifiers  = create_classifiers()
		if verbose:
			for c in classifiers:
				c.print_details()
			print('------------------------------------') 
		for x in range(len(environments)):		
			step(environments[x], classifiers);
		time_end = time.time()
		total_time = time_end - time_start
		print(total_time, "seconds")
		output_file = open(CLASSIFIERS_FILE, "w")
		write_classifiers(classifiers, output_file)		
	def do_classify_mode():
		def read_classifiers():
			print("Reading classifiers...")			
			with open(CLASSIFIERS_FILE, "r") as file:
				classifier_dict = [ast.literal_eval(l) for l in file.readlines()]
			return [Classifier(from_dict = k) for k in classifier_dict]
		# One timestep. 
		def step(environment, classifiers, total_correct, total_seen):
			match_set = []
			for c in classifiers:
				cl = c.classify(environment)			# [classifier, action, accuracy]
					match_set.append(cl)
			sorted_set = sorted(match_set, key=lambda tup: tup[1])
			if len(sorted_set) > 0:
			  action = sorted_set[0][1]
			  if action == environment.correct_class:
				  correct = "Correct!"
				  total_correct += 1
				  correct = "Fail    "
			  print("Action:", sorted_set[0][1], " | Accuracy:", "%.2f" % (sorted_set[0][0] * 100), "% |", correct, "{", total_correct, total_seen, "(", "%.5f" % (total_correct * 1.0 / total_seen * 1.0 * 100), ") }")
				"No classification can be made."
			return total_correct
		classifiers = read_classifiers()
		total_correct = 0
		total_seen = 0
		for x in range(len(environments)):		
			total_seen += 1
			total_correct = step(environments[x], classifiers, total_correct, total_seen);		  
	if mode == LEARN_MODE:
		do_learn_mode()
		do_classify_mode()
if __name__ == "__main__":
    main(sys.argv[1:])	
''' Notes '''
# Look at all classifiers in the match set
# Look at the classifier in M with highest accuracy
# Action set = all classifiers with that same class label as action
# Reward = given when it is part of the action set
# Prediction p , estimate payoff when rule is seen
# Accuracy relative to others
Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

lcs.py~

Latest commit

History

lcs.py~

File metadata and controls