Skip to content

Commit 81413fd

Browse files
committed
made small tweaks to cleaning module
1 parent e154cc1 commit 81413fd

File tree

3 files changed

+6
-5
lines changed

3 files changed

+6
-5
lines changed

text_extensions_for_pandas/cleaning/__init__.py

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -14,10 +14,11 @@
1414
#
1515

1616
################################################################################
17-
# io module
17+
# cleaning module
1818
#
19-
# Functions in text_extensions_for_pandas that create DataFrames and convert
20-
# them to other formats.
19+
# Functions in text_extensions_for_pandas that allow for identification of
20+
# possibly incorrect labels, and quick training of models on BERT embeddings
21+
# of a corpus.
2122

2223
# Expose the public APIs that users should get from importing the top-level
2324
# library.

text_extensions_for_pandas/cleaning/analysis.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -20,6 +20,7 @@
2020

2121
import numpy as np
2222
import pandas as pd
23+
from typing import *
2324

2425
import text_extensions_for_pandas as tp
2526

@@ -28,7 +29,6 @@
2829

2930
tp = importlib.reload(tp)
3031

31-
from typing import *
3232

3333

3434
def create_f1_score_report(

text_extensions_for_pandas/cleaning/preprocess.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -269,7 +269,7 @@ def preprocess_documents(
269269
else:
270270
for fold in bert_docs_by_fold.keys():
271271
for docnum in range(len(bert_docs_by_fold[fold])):
272-
bert_docs_by_fold[fold][docnum][iob_col].fillna(
272+
bert_docs_by_fold[fold][docnum][label_col].fillna(
273273
default_label_type, inplace=True
274274
)
275275
bert_docs_by_fold[fold][docnum][

0 commit comments

Comments
 (0)