ydshieh
committed on
Commit
•
09d2e16
1
Parent(s):
6984f2b
add instructions for downloading coco
Browse files
- coco_dataset/download_coco.txt +12 -0
- usage_example.txt +2 -0
coco_dataset/download_coco.txt
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
mkdir data
|
2 |
+
cd data
|
3 |
+
wget http://images.cocodataset.org/zips/train2017.zip
|
4 |
+
wget http://images.cocodataset.org/zips/val2017.zip
|
5 |
+
wget http://images.cocodataset.org/zips/test2017.zip
|
6 |
+
wget http://images.cocodataset.org/annotations/annotations_trainval2017.zip
|
7 |
+
wget http://images.cocodataset.org/annotations/image_info_test2017.zip
|
8 |
+
unzip train2017.zip
|
9 |
+
unzip val2017.zip
|
10 |
+
unzip test2017.zip
|
11 |
+
unzip annotations_trainval2017.zip
|
12 |
+
unzip image_info_test2017.zip
|
usage_example.txt
CHANGED
@@ -1,3 +1,5 @@
|
|
1 |
python3 run_image_captioning_flax.py --dataset_name ./coco_dataset/coco_dataset.py --dataset_config_name=2017 --data_dir ./coco_dataset/dummy_data/ --caption_column caption --image_column image_path --max_target_length 8 --num_beams 2 --output_dir debug --do_train --per_device_train_batch_size 2 --do_eval --per_device_eval_batch_size 4 --do_predict --max_train_samples 16 --max_eval_samples 16 --max_predict_samples 16 --preprocessing_num_workers 2 --num_train_epochs 3 --learning_rate 3e-5 --do_predict_after_evaluation --predict_with_generate --logging_steps 2 --block_size 8 --encoder_model_name_or_path ./encoder-decoder/encoder/ --decoder_model_name_or_path ./encoder-decoder/decoder/
|
2 |
|
|
|
|
|
3 |
python3 run_image_captioning_flax.py --dataset_name ./image_caption_dataset/image_caption_dataset.py --dataset_config_name=coco_2017 --data_dir ./image_caption_dataset/coco_dataset/ --caption_column en --image_column image_path --max_target_length 8 --num_beams 2 --output_dir debug --do_train --per_device_train_batch_size 2 --do_eval --per_device_eval_batch_size 4 --do_predict --max_train_samples 16 --max_eval_samples 16 --max_predict_samples 16 --preprocessing_num_workers 2 --num_train_epochs 3 --learning_rate 3e-5 --do_predict_after_evaluation --predict_with_generate --logging_steps 2 --block_size 8 --encoder_model_name_or_path ./encoder-decoder/encoder/ --decoder_model_name_or_path ./encoder-decoder/decoder
|
1 |
python3 run_image_captioning_flax.py --dataset_name ./coco_dataset/coco_dataset.py --dataset_config_name=2017 --data_dir ./coco_dataset/dummy_data/ --caption_column caption --image_column image_path --max_target_length 8 --num_beams 2 --output_dir debug --do_train --per_device_train_batch_size 2 --do_eval --per_device_eval_batch_size 4 --do_predict --max_train_samples 16 --max_eval_samples 16 --max_predict_samples 16 --preprocessing_num_workers 2 --num_train_epochs 3 --learning_rate 3e-5 --do_predict_after_evaluation --predict_with_generate --logging_steps 2 --block_size 8 --encoder_model_name_or_path ./encoder-decoder/encoder/ --decoder_model_name_or_path ./encoder-decoder/decoder/
|
2 |
|
3 |
+
python3 run_image_captioning_flax.py --dataset_name ./coco_dataset/coco_dataset.py --dataset_config_name=2017 --data_dir ./coco_dataset/data/ --caption_column caption --image_column image_path --max_target_length 8 --num_beams 2 --output_dir debug --do_train --per_device_train_batch_size 2 --do_eval --per_device_eval_batch_size 4 --do_predict --max_train_samples 16 --max_eval_samples 16 --max_predict_samples 16 --preprocessing_num_workers 2 --num_train_epochs 3 --learning_rate 3e-5 --do_predict_after_evaluation --predict_with_generate --logging_steps 2 --block_size 8 --encoder_model_name_or_path ./encoder-decoder/encoder/ --decoder_model_name_or_path ./encoder-decoder/decoder/
|
4 |
+
|
5 |
python3 run_image_captioning_flax.py --dataset_name ./image_caption_dataset/image_caption_dataset.py --dataset_config_name=coco_2017 --data_dir ./image_caption_dataset/coco_dataset/ --caption_column en --image_column image_path --max_target_length 8 --num_beams 2 --output_dir debug --do_train --per_device_train_batch_size 2 --do_eval --per_device_eval_batch_size 4 --do_predict --max_train_samples 16 --max_eval_samples 16 --max_predict_samples 16 --preprocessing_num_workers 2 --num_train_epochs 3 --learning_rate 3e-5 --do_predict_after_evaluation --predict_with_generate --logging_steps 2 --block_size 8 --encoder_model_name_or_path ./encoder-decoder/encoder/ --decoder_model_name_or_path ./encoder-decoder/decoder
|