Spaces:
Running
Running
# To use default value, set to null | |
leafmachine: | |
use_RGB_label_images: True | |
do: | |
check_for_illegal_filenames: False | |
check_for_corrupt_images_make_vertical: False | |
print: | |
verbose: True | |
optional_warnings: True | |
logging: | |
log_level: null | |
# Overall Project Input Settings | |
project: | |
# Image to Process | |
dir_images_local: 'D:\Dropbox\LM2_Env\VoucherVision_Datasets\2022_09_07_thru12_S3_jacortez_AllAsia' # 'D:/Dropbox/LM2_Env/VoucherVision_Datasets/Compare_Set_Easy_10imgs/imgs' #'D:\D_Desktop\Richie\Imgs' #'D:/Dropbox/LM2_Env/Image_Datasets/Acacia/Acacia_prickles_4-26-23_LANCZOS/images/short' #'D:\D_Desktop\Richie\Imgs' #'home/brlab/Dropbox/LM2_Env/Image_Datasets/Manuscript_Images' # 'D:\Dropbox\LM2_Env\Image_Datasets\SET_FieldPrism_Test\TESTING_OUTPUT\Images_Processed\REU_Field_QR-Code-Images\Cannon_Corrected\Images_Corrected' # 'F:\temp_3sppFamily' # 'D:/Dropbox/LM2_Env/Image_Datasets/GBIF_BroadSample_3SppPerFamily' # SET_Diospyros/images_short' # 'D:/Dropbox/LM2_Env/Image_Datasets/SET_Diospyros/images_short' #'D:\Dropbox\LM2_Env\Image_Datasets\GBIF_BroadSample_Herbarium' #'D:/Dropbox/LM2_Env/Image_Datasets/SET_Diospyros/images_short' # str | only for image_location:local | full path for directory containing images | |
# dir_images_local: 'D:/Dropbox/LM2_Env/VoucherVision_Datasets/Compare_Set_Easy_10imgs/imgs' #'D:\D_Desktop\Richie\Imgs' #'D:/Dropbox/LM2_Env/Image_Datasets/Acacia/Acacia_prickles_4-26-23_LANCZOS/images/short' #'D:\D_Desktop\Richie\Imgs' #'home/brlab/Dropbox/LM2_Env/Image_Datasets/Manuscript_Images' # 'D:\Dropbox\LM2_Env\Image_Datasets\SET_FieldPrism_Test\TESTING_OUTPUT\Images_Processed\REU_Field_QR-Code-Images\Cannon_Corrected\Images_Corrected' # 'F:\temp_3sppFamily' # 'D:/Dropbox/LM2_Env/Image_Datasets/GBIF_BroadSample_3SppPerFamily' # SET_Diospyros/images_short' # 'D:/Dropbox/LM2_Env/Image_Datasets/SET_Diospyros/images_short' #'D:\Dropbox\LM2_Env\Image_Datasets\GBIF_BroadSample_Herbarium' #'D:/Dropbox/LM2_Env/Image_Datasets/SET_Diospyros/images_short' # str | only for image_location:local | full path for directory containing images | |
image_location: 'local' | |
continue_run_from_partial_xlsx: 'D:\Dropbox\LM2_Env\VoucherVision_Datasets\POC_chatGPT__2022_09_07_thru12_S3_jacortez_AllAsia\2022_09_07_thru12_S3_jacortez_AllAsia\Transcription\transcribed.xlsx' | |
# continue_run_from_partial_xlsx: null | |
# Project Output Dir | |
dir_output: 'D:/Dropbox/LM2_Env/VoucherVision_Datasets/POC_chatGPT__2022_09_07_thru12_S3_jacortez_AllAsia' # 'D:/Dropbox/LM2_Env/Image_Datasets/TEST_LM2' # 'D:\D_Desktop\Richie\Richie_Out' | |
run_name: 'POC_chatGPT' #'images_short_TEST' #'images_short_landmark' | |
prefix_removal: 'MICH-V-' | |
suffix_removal: '' | |
catalog_numerical_only: True | |
# Embeddings and LLM | |
use_domain_knowledge: True | |
embeddings_database_name: 'EmbeddingsDB_all_asia_minimal_InRegion' | |
build_new_embeddings_database: False | |
path_to_domain_knowledge_xlsx: 'D:\Dropbox\LeafMachine2\leafmachine2\transcription\domain_knowledge/AllAsiaMinimalasof25May2023_2__InRegion.xlsx' #'D:/Dropbox/LeafMachine2/leafmachine2/transcription/domain_knowledge/AllAsiaMinimalasof25May2023_2__TRIMMEDtiny.xlsx' | |
batch_size: 500 #null # null = all | |
num_workers: 1 # int |DEFAULT| 4 # More is not always better. Most hardware loses performance after 4 | |
modules: | |
specimen_crop: True | |
LLM_version: 'chatGPT' # from 'chatGPT' OR 'PaLM' | |
cropped_components: | |
# empty list for all, add to list to IGNORE, lowercase, comma separated | |
# archival |FROM| | |
# ruler, barcode, colorcard, label, map, envelope, photo, attached_item, weights | |
# plant |FROM| | |
# leaf_whole, leaf_partial, leaflet, seed_fruit_one, seed_fruit_many, flower_one, flower_many, bud, specimen, roots, wood | |
do_save_cropped_annotations: True | |
save_cropped_annotations: ['label','barcode'] # 'save_all' to save all classes | |
save_per_image: False # creates a folder for each image, saves crops into class-names folders # TODO | |
save_per_annotation_class: True # saves crops into class-names folders | |
binarize_labels: False | |
binarize_labels_skeletonize: False | |
data: | |
save_json_rulers: False | |
save_json_measurements: False | |
save_individual_csv_files_rulers: False | |
save_individual_csv_files_measurements: False | |
include_darwin_core_data_from_combined_file: False | |
do_apply_conversion_factor: False ########################### | |
overlay: | |
save_overlay_to_pdf: True | |
save_overlay_to_jpgs: True | |
overlay_dpi: 300 # int |FROM| 100 to 300 | |
overlay_background_color: 'black' # str |FROM| 'white' or 'black' | |
show_archival_detections: True | |
ignore_archival_detections_classes: [] | |
show_plant_detections: True | |
ignore_plant_detections_classes: ['leaf_whole', 'specimen'] #['leaf_whole', 'leaf_partial', 'specimen'] | |
show_segmentations: True | |
show_landmarks: True | |
ignore_landmark_classes: [] | |
line_width_archival: 2 # int | |
line_width_plant: 6 # int | |
line_width_seg: 12 # int # thick = 12 | |
line_width_efd: 6 # int # thick = 3 | |
alpha_transparency_archival: 0.3 # float between 0 and 1 | |
alpha_transparency_plant: 0 | |
alpha_transparency_seg_whole_leaf: 0.4 | |
alpha_transparency_seg_partial_leaf: 0.3 | |
# Configure Archival Component Detector | |
archival_component_detector: | |
# ./leafmachine2/component_detector/runs/train/detector_type/detector_version/detector_iteration/weights/detector_weights | |
detector_type: 'Archival_Detector' | |
detector_version: 'PREP_final' | |
detector_iteration: 'PREP_final' | |
detector_weights: 'best.pt' | |
minimum_confidence_threshold: 0.5 | |
do_save_prediction_overlay_images: True | |
ignore_objects_for_overlay: [] # list[str] # list of objects that can be excluded from the overlay # all = null | |