Skip to content

Commit

Permalink
* minor modifications
Browse files Browse the repository at this point in the history
  • Loading branch information
HYLcool committed Nov 13, 2023
1 parent 23e4e3a commit acaeb10
Show file tree
Hide file tree
Showing 3 changed files with 2 additions and 3 deletions.
2 changes: 1 addition & 1 deletion configs/config_all.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -116,7 +116,7 @@ process:
use_words_aug: false # whether to augment words, especially for Chinese and Vietnamese
words_aug_group_sizes: [2] # the group size of words to augment
words_aug_join_char: "" # the join char between words to augment
- - image_aspect_ratio_filter: # filter samples according to the aspect ratios of images in them
+ - image_aspect_ratio_filter: # filter samples according to the aspect ratios of images (a fraction of width by height, r=w/h) in them
min_ratio: 0.333 # the min aspect ratio of filter range
max_ratio: 3.0 # the max aspect ratio of filter range
any_or_all: any # keep this sample when any/all images meet the filter condition
Expand Down
1 change: 0 additions & 1 deletion data_juicer/config/config.py
Original file line number Diff line number Diff line change
Expand Up @@ -437,7 +437,6 @@ def sort_op_by_types_and_names(op_name_classes):

def config_backup(cfg):
cfg_path = cfg.config[0].absolute
- cfg.cfg_path = os.path.dirname(cfg_path) # record the path of config
work_dir = cfg.work_dir
target_path = os.path.join(work_dir, os.path.basename(cfg_path))
logger.info(f'Back up the input config file [{cfg_path}] into the '
Expand Down
2 changes: 1 addition & 1 deletion data_juicer/ops/base_op.py
Original file line number Diff line number Diff line change
Expand Up @@ -36,7 +36,7 @@ def __init__(self,
image_key: str = None,
):
"""
- Base class that conducts text editing.
+ Base class that conducts data editing.
:param text_key: the key name of field that stores sample texts
to be processed.
Expand Down

0 comments on commit acaeb10

Please sign in to comment.