Knowledge-Graph-Completion/graph_completion.py at master · twiet/Knowledge-Graph-Completion · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
import abc

class graph_completion(abc.ABC):
	# The output of each of the following methods should be defined clearly and shared between all methods implemented by members of the group.

	@abc.abstractmethod
	def read_dataset(self, fileName, options={}):
		"""
		Reads a dataset in preparation for: train or test. Returns data in proper format for: train or test.

		Args:
			fileName: Name of file representing the dataset to read
			options: object to store any extra or implementation specific data

		Returns:
			Iterable data, optionally split into train, test, and possibly dev.
		"""
		pass


	@abc.abstractmethod
	def train(self, data, options={}):
		"""
		Trains a model on the given input data

		Args:
			data: iterable of arbitrary format
			options: object to store any extra or implementation specific data

		Returns:
			ret: None. Trained model stored internally to instance's state.
		"""
		pass


	@abc.abstractmethod
	def predict(self, data, options={}):
		"""
		Predicts on the given input data (e.g. knowledge graph). Assumes model has been trained with train()

		Args:
			data: iterable of arbitrary format. represents the data instances and features you use to make predictions
				Note that prediction requires trained model. Precondition: instance already stores trained model
				information.
			options: object to store any extra or implementation specific data

		Returns:
			predictions: [tuple,...], i.e. list of predicted tuples.
				Each tuple likely will follow format: (subject_entity, relation, object_entity), but isn't required.
		"""
		pass

	@abc.abstractmethod
	def evaluate(self, benchmark_data, metrics={}, options={}):
		"""
		Calculates evaluation metrics on chosen benchmark dataset.
		Precondition: model has been trained and predictions were generated from predict()

		Args:
			benchmark_data: Iterable testing split of dataset to evaluate on
			metrics: Dictionary of function pointers for desired evaluation metrics (e.g. F1, MRR, etc.)
				- Note: This abstract base class does not enforce a metric because some metrics are more appropriate
				for a given benchmark than others. At least one metric should be specified
				- example format:
					metrics = {
						"F1": f1_eval_function,
						"MRR": mrr_eval_function
					}
			options: object to store any extra or implementation specific data

		Returns:
			evaluations: dictionary of scores with respect to chosen metrics
				- e.g.
					evaluations = {
						"f1": 0.5,
						"MRR": 0.8
					}
		"""
		pass