Skip to content

Commit 423dab9

Browse files
committed
CU-8699049kf: Fix a few v1 vs v2 access issues
1 parent a2e9726 commit 423dab9

File tree

4 files changed

+19
-17
lines changed

4 files changed

+19
-17
lines changed

medcat/2_train_model/1_unsupervised_training/unsupervised_medcattraining.py

Lines changed: 9 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -28,13 +28,14 @@
2828
df = cs.DataFrame(index=cogstack_indices, columns=text_columns) # type: ignore
2929

3030
cat = CAT.load_model_pack(model_pack_path+model_pack_name)
31-
cat.cdb.print_stats()
32-
cat.train(data_iterator=df[text_columns].iterrows(),
33-
nepochs=1,
34-
fine_tune=True,
35-
progress_print=10000,
36-
is_resumed=False)
31+
print(cat.cdb.get_basic_info())
32+
cat.trainer.train_unsupervised(
33+
data_iterator=df[text_columns].iterrows(),
34+
nepochs=1,
35+
fine_tune=True,
36+
progress_print=10000,
37+
is_resumed=False)
3738

38-
cat.cdb.print_stats()
39+
print(cat.cdb.get_basic_info())
3940

40-
cat.create_model_pack(save_dir_path=model_pack_path, model_pack_name=output_modelpack_name)
41+
cat.save_model_pack(save_dir_path=model_pack_path, model_pack_name=output_modelpack_name)

medcat/2_train_model/1_unsupervised_training/unsupervised_training.py

Lines changed: 7 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -1,3 +1,4 @@
1+
from medcat.cat import logger as cat_logger
12
from medcat.cat import CAT
23
import pandas as pd
34
import os
@@ -44,25 +45,25 @@
4445
# Load modelpack
4546
print('Loading modelpack')
4647
cat = CAT.load_model_pack(model_pack_path)
47-
cat.log.addHandler(logging.StreamHandler()) # add console output
48+
cat_logger.addHandler(logging.StreamHandler()) # add console output
4849

4950
print('STATS:')
50-
cat.cdb.print_stats()
51+
print(cat.cdb.get_basic_info())
5152

5253
# CHANGE AS NEEDED - if the number of split files is different
5354
all_data_files = [f'split_notes_5M_{nr}.csv' for nr in range(1, 20)] # file containing training material.
5455
for i, data_file in enumerate(all_data_files):
5556
# Load training data
5657
print('Load data for', i, 'from', data_file)
5758
data = pd.read_csv(os.path.join(data_dir, data_file))
58-
cat.train(data.text.values, progress_print=100)
59+
cat.trainer.train_unsupervised(data.text.values, progress_print=100)
5960

6061
print('Stats now, after', i)
61-
cat.cdb.print_stats()
62+
print(cat.cdb.get_basic_info())
6263

6364
# save modelpack
64-
cat.create_model_pack(save_dir_path=model_dir, model_pack_name=f"{output_modelpack}_{i}")
65+
cat.save_model_pack(save_dir_path=model_dir, model_pack_name=f"{output_modelpack}_{i}")
6566

6667
# save modelpack - ALL
67-
cat.create_model_pack(save_dir_path=model_dir, model_pack_name=output_modelpack)
68+
cat.save_model_pack(save_dir_path=model_dir, model_pack_name=output_modelpack)
6869

medcat/3_run_model/run_model.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -59,7 +59,7 @@
5959
else:
6060
snomed_filter = set(cat.cdb.cui2info.keys())
6161

62-
cat.config.linking.filters.cuis = snomed_filter
62+
cat.config.components.linking.filters.cuis = snomed_filter
6363
del snomed_filter
6464

6565
# build query, change as appropriate

medcat/compare_models/compare.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -154,8 +154,8 @@ def get_diffs_for(model_pack_path_1: str,
154154
if show_progress:
155155
print("After adding children from 2nd model have a total of",
156156
len(cui_filter), "CUIs")
157-
cat1.config.linking.filters.cuis = cui_filter
158-
cat2.config.linking.filters.cuis = cui_filter
157+
cat1.config.components.linking.filters.cuis = cui_filter
158+
cat2.config.components.linking.filters.cuis = cui_filter
159159
ann_diffs = get_per_annotation_diffs(cat1, cat2, documents, keep_raw=keep_raw,
160160
doc_limit=doc_limit)
161161
if show_progress:

0 commit comments

Comments
 (0)