7-Add-database-to-project #14
7 changed files with 6687 additions and 22 deletions
|
|
@ -11,7 +11,7 @@ class AppleNotesParser(BaseNotesParser):
|
||||||
"""Parser for Apple Notes format training data."""
|
"""Parser for Apple Notes format training data."""
|
||||||
|
|
||||||
def __init__(self):
|
def __init__(self):
|
||||||
super().__init__("apple.md", unique_apple_exercises_mapper)
|
super().__init__("complete_data/apple.md", unique_apple_exercises_mapper)
|
||||||
|
|
||||||
def filter_training_data(self, training_data: str) -> str:
|
def filter_training_data(self, training_data: str) -> str:
|
||||||
"""Filter Apple-specific training data format."""
|
"""Filter Apple-specific training data format."""
|
||||||
|
|
|
||||||
|
|
@ -11,7 +11,7 @@ class ObsidianNotesParser(BaseNotesParser):
|
||||||
|
|
||||||
def __init__(self):
|
def __init__(self):
|
||||||
super().__init__(
|
super().__init__(
|
||||||
data_file_name="obsidian.md",
|
data_file_name="complete_data/obsidian.md",
|
||||||
exercise_mapper=obsidian_unique_exercies_mapping,
|
exercise_mapper=obsidian_unique_exercies_mapping,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@ -5,28 +5,23 @@ from pprint import pprint
|
||||||
|
|
||||||
|
|
||||||
om = ObsidianNotesParser()
|
om = ObsidianNotesParser()
|
||||||
obsidian_result = defaultdict(int)
|
o_mapped_trainings = om.parse_training_data()
|
||||||
o_mapped_trainings = om.parse_and_map_training_data()
|
|
||||||
for training in o_mapped_trainings:
|
|
||||||
for exercise in training.exercises:
|
|
||||||
obsidian_result[exercise.name] += 1
|
|
||||||
|
|
||||||
am = AppleNotesParser()
|
am = AppleNotesParser()
|
||||||
apple_result = defaultdict(int)
|
a_mapped_trainings = am.parse_training_data()
|
||||||
a_mapped_trainings = am.parse_and_map_training_data()
|
|
||||||
for training in a_mapped_trainings:
|
|
||||||
for exercise in training.exercises:
|
|
||||||
apple_result[exercise.name] += 1
|
|
||||||
|
|
||||||
print(f"apple trainings:\t{len(a_mapped_trainings)}")
|
combined_list = o_mapped_trainings + a_mapped_trainings
|
||||||
print(f"osididian trainings:\t{len(o_mapped_trainings)}")
|
print(len(combined_list))
|
||||||
|
|
||||||
overall_trainings = a_mapped_trainings + o_mapped_trainings
|
comb_uniques_names = defaultdict(int)
|
||||||
print(f"overall trainings:\t{len(overall_trainings)}")
|
exercise_names = list()
|
||||||
|
|
||||||
overall_result = defaultdict(int)
|
for training in combined_list:
|
||||||
for training in overall_trainings:
|
if training.exercises:
|
||||||
for exercise in training.exercises:
|
for exercise in training.exercises:
|
||||||
overall_result[exercise.name] += 1
|
exercise_names.append(exercise.name)
|
||||||
|
comb_uniques_names[exercise.name] += 1
|
||||||
|
|
||||||
pprint(overall_result)
|
|
||||||
|
# pprint(set(exercise_names))
|
||||||
|
pprint(comb_uniques_names)
|
||||||
|
|
|
||||||
1086
data/apple_original_backup.md
Normal file
1086
data/apple_original_backup.md
Normal file
File diff suppressed because it is too large
Load diff
1086
data/complete_data/apple.md
Normal file
1086
data/complete_data/apple.md
Normal file
File diff suppressed because it is too large
Load diff
2249
data/complete_data/obsidian.md
Normal file
2249
data/complete_data/obsidian.md
Normal file
File diff suppressed because it is too large
Load diff
2249
data/obsidian_original_backup.md
Normal file
2249
data/obsidian_original_backup.md
Normal file
File diff suppressed because it is too large
Load diff
Loading…
Reference in a new issue