Skip to content

Commit

Permalink
Post linting
Browse files Browse the repository at this point in the history
  • Loading branch information
metric-space committed Dec 2, 2023
1 parent 9cb16ee commit 4025e45
Show file tree
Hide file tree
Showing 2 changed files with 8 additions and 3 deletions.
2 changes: 1 addition & 1 deletion dalm/datasets/reading_comprehension_generation/utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -154,7 +154,7 @@ def fix_first_prompt(text: str, chat_chain: List[Dict[str, str]]) -> List[Dict[s


# TODO: add test
# TODO: Address known issues described in #78
# TODO: Address known issues described in #78
def question_and_answer_extractor(whole_text: str, context: str) -> List[Dict[str, str]] | None:
text_lines = whole_text.split("\n")
question: List[str] = []
Expand Down
9 changes: 7 additions & 2 deletions dalm/pipelines/reading_comprehension_pipeline.py
Original file line number Diff line number Diff line change
Expand Up @@ -257,9 +257,14 @@ def parse_args() -> argparse.Namespace:
"--domain_spm_path",
type=str,
default=None,
help="path to the domain tokenizer used for regex based generation. If None is provided (default), it will be automatically generated.",
help=(
"path to the domain tokenizer used for regex based generation. "
"If None is provided (default), it will be automatically generated."
),
)
parser.add_argument(
"--input", type=str, required=True, help="A CSV file OR a directory containing the CSV input files"
)
parser.add_argument("--input", type=str, required=True, help="A CSV file OR a directory containing the CSV input files")
parser.add_argument("--csv_column", type=str, help="Column to read from the CSV file")
parser.add_argument("--no_chunk", action="store_true", help="whether to NOT chunk the input files or not")
parser.add_argument("--num_train_epochs", type=int, default=1, help="number of epochs to train the generator")
Expand Down

0 comments on commit 4025e45

Please sign in to comment.