|
<?xml version="1.0" encoding="UTF-8"?> |
|
<project version="4"> |
|
<component name="AutoImportSettings"> |
|
<option name="autoReloadType" value="SELECTIVE" /> |
|
</component> |
|
<component name="ChangeListManager"> |
|
<list default="true" id="c9169370-1a11-41d7-9648-02694630edd2" name="Changes" comment=""> |
|
<change beforePath="$PROJECT_DIR$/README.md" beforeDir="false" afterPath="$PROJECT_DIR$/README.md" afterDir="false" /> |
|
<change beforePath="$PROJECT_DIR$/wav2vec2-base-turkish/preprocessor_config.json" beforeDir="false" afterPath="$PROJECT_DIR$/wav2vec2-base-turkish/preprocessor_config.json" afterDir="false" /> |
|
<change beforePath="$PROJECT_DIR$/wav2vec2-base-turkish/special_tokens_map.json" beforeDir="false" afterPath="$PROJECT_DIR$/wav2vec2-base-turkish/special_tokens_map.json" afterDir="false" /> |
|
<change beforePath="$PROJECT_DIR$/wav2vec2-base-turkish/tokenizer_config.json" beforeDir="false" afterPath="$PROJECT_DIR$/wav2vec2-base-turkish/tokenizer_config.json" afterDir="false" /> |
|
</list> |
|
<option name="SHOW_DIALOG" value="false" /> |
|
<option name="HIGHLIGHT_CONFLICTS" value="true" /> |
|
<option name="HIGHLIGHT_NON_ACTIVE_CHANGELIST" value="false" /> |
|
<option name="LAST_RESOLUTION" value="IGNORE" /> |
|
</component> |
|
<component name="FileTemplateManagerImpl"> |
|
<option name="RECENT_TEMPLATES"> |
|
<list> |
|
<option value="Python Script" /> |
|
</list> |
|
</option> |
|
</component> |
|
<component name="Git.Settings"> |
|
<option name="RECENT_GIT_ROOT_PATH" value="$PROJECT_DIR$" /> |
|
</component> |
|
<component name="MarkdownSettingsMigration"> |
|
<option name="stateVersion" value="1" /> |
|
</component> |
|
<component name="ProjectId" id="24KJYqb7IjKGUSNqPXUOjBSp5gx" /> |
|
<component name="ProjectLevelVcsManager" settingsEditedManually="true" /> |
|
<component name="ProjectViewState"> |
|
<option name="hideEmptyMiddlePackages" value="true" /> |
|
<option name="showLibraryContents" value="true" /> |
|
</component> |
|
<component name="PropertiesComponent"> |
|
<property name="RunOnceActivity.OpenProjectViewOnStart" value="true" /> |
|
<property name="RunOnceActivity.ShowReadmeOnStart" value="true" /> |
|
<property name="WebServerToolWindowFactoryState" value="false" /> |
|
<property name="last_opened_file_path" value="$PROJECT_DIR$/../wav2vec2-base-turkish-artificial-cv" /> |
|
<property name="node.js.detected.package.eslint" value="true" /> |
|
<property name="node.js.detected.package.tslint" value="true" /> |
|
<property name="node.js.selected.package.eslint" value="(autodetect)" /> |
|
<property name="node.js.selected.package.tslint" value="(autodetect)" /> |
|
<property name="settings.editor.selected.configurable" value="com.jetbrains.python.configuration.PyActiveSdkModuleConfigurable" /> |
|
</component> |
|
<component name="RecentsManager"> |
|
<key name="CopyFile.RECENT_KEYS"> |
|
<recent name="$PROJECT_DIR$/language_model" /> |
|
</key> |
|
</component> |
|
<component name="RunManager" selected="Python.eval"> |
|
<configuration name="eval" type="PythonConfigurationType" factoryName="Python" nameIsGenerated="true"> |
|
<module name="wav2vec2-base-turkish" /> |
|
<option name="INTERPRETER_OPTIONS" value="" /> |
|
<option name="PARENT_ENVS" value="true" /> |
|
<envs> |
|
<env name="PYTHONUNBUFFERED" value="1" /> |
|
</envs> |
|
<option name="SDK_HOME" value="" /> |
|
<option name="WORKING_DIRECTORY" value="$PROJECT_DIR$" /> |
|
<option name="IS_MODULE_SDK" value="true" /> |
|
<option name="ADD_CONTENT_ROOTS" value="true" /> |
|
<option name="ADD_SOURCE_ROOTS" value="true" /> |
|
<EXTENSION ID="PythonCoverageRunConfigurationExtension" runner="coverage.py" /> |
|
<option name="SCRIPT_NAME" value="$PROJECT_DIR$/eval.py" /> |
|
<option name="PARAMETERS" value="--model_id cahya/wav2vec2-base-turkish --dataset ./dataset/common_voice --config tr --data_dir /mnt/mldata/data/ASR/turkish/cv-corpus-6.1-2020-12-11 --split test --log_outputs" /> |
|
<option name="SHOW_COMMAND_LINE" value="false" /> |
|
<option name="EMULATE_TERMINAL" value="false" /> |
|
<option name="MODULE_MODE" value="false" /> |
|
<option name="REDIRECT_INPUT" value="false" /> |
|
<option name="INPUT_FILE" value="" /> |
|
<method v="2" /> |
|
</configuration> |
|
<configuration name="ngram" type="PythonConfigurationType" factoryName="Python" temporary="true" nameIsGenerated="true"> |
|
<module name="wav2vec2-base-turkish" /> |
|
<option name="INTERPRETER_OPTIONS" value="" /> |
|
<option name="PARENT_ENVS" value="true" /> |
|
<envs> |
|
<env name="PYTHONUNBUFFERED" value="1" /> |
|
</envs> |
|
<option name="SDK_HOME" value="" /> |
|
<option name="WORKING_DIRECTORY" value="$PROJECT_DIR$" /> |
|
<option name="IS_MODULE_SDK" value="true" /> |
|
<option name="ADD_CONTENT_ROOTS" value="true" /> |
|
<option name="ADD_SOURCE_ROOTS" value="true" /> |
|
<EXTENSION ID="PythonCoverageRunConfigurationExtension" runner="coverage.py" /> |
|
<option name="SCRIPT_NAME" value="$PROJECT_DIR$/ngram.py" /> |
|
<option name="PARAMETERS" value="" /> |
|
<option name="SHOW_COMMAND_LINE" value="false" /> |
|
<option name="EMULATE_TERMINAL" value="false" /> |
|
<option name="MODULE_MODE" value="false" /> |
|
<option name="REDIRECT_INPUT" value="false" /> |
|
<option name="INPUT_FILE" value="" /> |
|
<method v="2" /> |
|
</configuration> |
|
<configuration name="run_speech_recognition_ctc" type="PythonConfigurationType" factoryName="Python" nameIsGenerated="true"> |
|
<module name="wav2vec2-base-turkish" /> |
|
<option name="INTERPRETER_OPTIONS" value="" /> |
|
<option name="PARENT_ENVS" value="true" /> |
|
<envs> |
|
<env name="PYTHONUNBUFFERED" value="1" /> |
|
</envs> |
|
<option name="SDK_HOME" value="" /> |
|
<option name="WORKING_DIRECTORY" value="$PROJECT_DIR$" /> |
|
<option name="IS_MODULE_SDK" value="true" /> |
|
<option name="ADD_CONTENT_ROOTS" value="true" /> |
|
<option name="ADD_SOURCE_ROOTS" value="true" /> |
|
<EXTENSION ID="PythonCoverageRunConfigurationExtension" runner="coverage.py" /> |
|
<option name="SCRIPT_NAME" value="$PROJECT_DIR$/run_speech_recognition_ctc.py" /> |
|
<option name="PARAMETERS" value="--dataset_name=&quot;common_voice&quot; --model_name_or_path=&quot;cahya/wav2vec2-base-turkish-artificial-cv&quot; --dataset_config_name=&quot;tr&quot; --output_dir=&quot;./output&quot; --overwrite_output_dir --num_train_epochs=&quot;1&quot; --per_device_train_batch_size=&quot;2&quot; --per_device_eval_batch_size=&quot;2&quot; --gradient_accumulation_steps=&quot;4&quot; --learning_rate=&quot;7.5e-7&quot; --warmup_steps=&quot;2000&quot; --length_column_name=&quot;input_length&quot; --evaluation_strategy=&quot;steps&quot; --text_column_name=&quot;sentence&quot; --save_steps=&quot;500&quot; --eval_steps=&quot;500&quot; --logging_steps=&quot;100&quot; --layerdrop=&quot;0.0&quot; --activation_dropout=&quot;0.1&quot; --save_total_limit=&quot;3&quot; --freeze_feature_encoder --feat_proj_dropout=&quot;0.0&quot; --mask_time_prob=&quot;0.75&quot; --mask_time_length=&quot;10&quot; --mask_feature_prob=&quot;0.25&quot; --mask_feature_length=&quot;64&quot; --gradient_checkpointing --use_auth_token --fp16=false --group_by_length --do_train=true --do_eval=true --push_to_hub --chars_to_ignore , ? . ! \; \: \&quot;\&quot; \% \' \&quot; \' \' \` … \’ » « \‘ '“' '”' � é û" /> |
|
<option name="SHOW_COMMAND_LINE" value="false" /> |
|
<option name="EMULATE_TERMINAL" value="false" /> |
|
<option name="MODULE_MODE" value="false" /> |
|
<option name="REDIRECT_INPUT" value="false" /> |
|
<option name="INPUT_FILE" value="" /> |
|
<method v="2" /> |
|
</configuration> |
|
<configuration name="test-vocab" type="PythonConfigurationType" factoryName="Python" temporary="true" nameIsGenerated="true"> |
|
<module name="wav2vec2-base-turkish" /> |
|
<option name="INTERPRETER_OPTIONS" value="" /> |
|
<option name="PARENT_ENVS" value="true" /> |
|
<envs> |
|
<env name="PYTHONUNBUFFERED" value="1" /> |
|
</envs> |
|
<option name="SDK_HOME" value="" /> |
|
<option name="WORKING_DIRECTORY" value="$PROJECT_DIR$" /> |
|
<option name="IS_MODULE_SDK" value="true" /> |
|
<option name="ADD_CONTENT_ROOTS" value="true" /> |
|
<option name="ADD_SOURCE_ROOTS" value="true" /> |
|
<EXTENSION ID="PythonCoverageRunConfigurationExtension" runner="coverage.py" /> |
|
<option name="SCRIPT_NAME" value="$PROJECT_DIR$/test-vocab.py" /> |
|
<option name="PARAMETERS" value="" /> |
|
<option name="SHOW_COMMAND_LINE" value="false" /> |
|
<option name="EMULATE_TERMINAL" value="false" /> |
|
<option name="MODULE_MODE" value="false" /> |
|
<option name="REDIRECT_INPUT" value="false" /> |
|
<option name="INPUT_FILE" value="" /> |
|
<method v="2" /> |
|
</configuration> |
|
<recent_temporary> |
|
<list> |
|
<item itemvalue="Python.ngram" /> |
|
<item itemvalue="Python.test-vocab" /> |
|
</list> |
|
</recent_temporary> |
|
</component> |
|
<component name="SpellCheckerSettings" RuntimeDictionaries="0" Folders="0" CustomDictionaries="0" DefaultDictionary="application-level" UseSingleDictionary="true" transferred="true" /> |
|
<component name="TaskManager"> |
|
<task active="true" id="Default" summary="Default task"> |
|
<changelist id="c9169370-1a11-41d7-9648-02694630edd2" name="Changes" comment="" /> |
|
<created>1643373395175</created> |
|
<option name="number" value="Default" /> |
|
<option name="presentableId" value="Default" /> |
|
<updated>1643373395175</updated> |
|
<workItem from="1643373396354" duration="4135000" /> |
|
<workItem from="1643465640987" duration="10417000" /> |
|
<workItem from="1643646039461" duration="615000" /> |
|
<workItem from="1643706833181" duration="7235000" /> |
|
</task> |
|
<task id="LOCAL-00001" summary="update unigrams.txt"> |
|
<created>1643492393885</created> |
|
<option name="number" value="00001" /> |
|
<option name="presentableId" value="LOCAL-00001" /> |
|
<option name="project" value="LOCAL" /> |
|
<updated>1643492393885</updated> |
|
</task> |
|
<task id="LOCAL-00002" summary="Add check_sound.ipynb"> |
|
<created>1643710330931</created> |
|
<option name="number" value="00002" /> |
|
<option name="presentableId" value="LOCAL-00002" /> |
|
<option name="project" value="LOCAL" /> |
|
<updated>1643710330931</updated> |
|
</task> |
|
<option name="localTasksCounter" value="3" /> |
|
<servers /> |
|
</component> |
|
<component name="TypeScriptGeneratedFilesManager"> |
|
<option name="version" value="3" /> |
|
</component> |
|
<component name="VcsManagerConfiguration"> |
|
<MESSAGE value="update unigrams.txt" /> |
|
<MESSAGE value="Add check_sound.ipynb" /> |
|
<option name="LAST_COMMIT_MESSAGE" value="Add check_sound.ipynb" /> |
|
</component> |
|
<component name="XDebuggerManager"> |
|
<breakpoint-manager> |
|
<breakpoints> |
|
<line-breakpoint enabled="true" suspend="THREAD" type="python-line"> |
|
<url>file://$PROJECT_DIR$/run_speech_recognition_ctc.py</url> |
|
<line>747</line> |
|
<option name="timeStamp" value="1" /> |
|
</line-breakpoint> |
|
<line-breakpoint enabled="true" suspend="THREAD" type="python-line"> |
|
<url>file://$PROJECT_DIR$/ngram.py</url> |
|
<line>5</line> |
|
<option name="timeStamp" value="2" /> |
|
</line-breakpoint> |
|
<line-breakpoint enabled="true" suspend="THREAD" type="python-line"> |
|
<url>file://$PROJECT_DIR$/test-vocab.py</url> |
|
<line>5</line> |
|
<option name="timeStamp" value="3" /> |
|
</line-breakpoint> |
|
<line-breakpoint enabled="true" suspend="THREAD" type="python-line"> |
|
<url>file://$PROJECT_DIR$/eval.py</url> |
|
<line>67</line> |
|
<option name="timeStamp" value="4" /> |
|
</line-breakpoint> |
|
<line-breakpoint enabled="true" suspend="THREAD" type="python-line"> |
|
<url>file://$PROJECT_DIR$/eval.py</url> |
|
<line>86</line> |
|
<option name="timeStamp" value="5" /> |
|
</line-breakpoint> |
|
<line-breakpoint enabled="true" suspend="THREAD" type="python-line"> |
|
<url>file://$PROJECT_DIR$/../transformers/src/transformers/pipelines/base.py</url> |
|
<line>1026</line> |
|
<option name="timeStamp" value="6" /> |
|
</line-breakpoint> |
|
<line-breakpoint enabled="true" suspend="THREAD" type="python-line"> |
|
<url>file://$PROJECT_DIR$/../transformers/src/transformers/pipelines/automatic_speech_recognition.py</url> |
|
<line>312</line> |
|
<option name="timeStamp" value="7" /> |
|
</line-breakpoint> |
|
</breakpoints> |
|
</breakpoint-manager> |
|
</component> |
|
<component name="com.intellij.coverage.CoverageDataManagerImpl"> |
|
<SUITE FILE_PATH="coverage/wav2vec2_base_turkish$test_vocab.coverage" NAME="test-vocab Coverage Results" MODIFIED="1643475983769" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="true" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$" /> |
|
<SUITE FILE_PATH="coverage/wav2vec2_base_turkish$eval.coverage" NAME="eval Coverage Results" MODIFIED="1643720743098" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="true" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$" /> |
|
<SUITE FILE_PATH="coverage/wav2vec2_base_turkish$ngram.coverage" NAME="ngram Coverage Results" MODIFIED="1643492280791" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="true" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$" /> |
|
<SUITE FILE_PATH="coverage/wav2vec2_base_turkish$run_speech_recognition_ctc.coverage" NAME="run_speech_recognition_ctc Coverage Results" MODIFIED="1643376049209" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="true" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$" /> |
|
</component> |
|
</project> |