wav2vec2-base-turkish / .idea /workspace.xml
cahya's picture
Training in progress, step 500
fcbce2b
raw
history blame
No virus
14.1 kB
<?xml version="1.0" encoding="UTF-8"?>
<project version="4">
<!-- Auto-import settings: the reload type is set to SELECTIVE. -->
<component name="AutoImportSettings">
  <option name="autoReloadType" value="SELECTIVE" />
</component>
<!-- Default changelist "Changes" with four entries whose before and after paths are
     identical: README.md and three JSON files under wav2vec2-base-turkish/.
     The trailing options are changelist dialog and highlighting flags. -->
<component name="ChangeListManager">
  <list default="true"
        id="c9169370-1a11-41d7-9648-02694630edd2"
        name="Changes"
        comment="">
    <change beforePath="$PROJECT_DIR$/README.md"
            beforeDir="false"
            afterPath="$PROJECT_DIR$/README.md"
            afterDir="false" />
    <change beforePath="$PROJECT_DIR$/wav2vec2-base-turkish/preprocessor_config.json"
            beforeDir="false"
            afterPath="$PROJECT_DIR$/wav2vec2-base-turkish/preprocessor_config.json"
            afterDir="false" />
    <change beforePath="$PROJECT_DIR$/wav2vec2-base-turkish/special_tokens_map.json"
            beforeDir="false"
            afterPath="$PROJECT_DIR$/wav2vec2-base-turkish/special_tokens_map.json"
            afterDir="false" />
    <change beforePath="$PROJECT_DIR$/wav2vec2-base-turkish/tokenizer_config.json"
            beforeDir="false"
            afterPath="$PROJECT_DIR$/wav2vec2-base-turkish/tokenizer_config.json"
            afterDir="false" />
  </list>
  <option name="SHOW_DIALOG" value="false" />
  <option name="HIGHLIGHT_CONFLICTS" value="true" />
  <option name="HIGHLIGHT_NON_ACTIVE_CHANGELIST" value="false" />
  <option name="LAST_RESOLUTION" value="IGNORE" />
</component>
<!-- Recently used file templates; the list holds a single entry, "Python Script". -->
<component name="FileTemplateManagerImpl">
  <option name="RECENT_TEMPLATES">
    <list>
      <option value="Python Script" />
    </list>
  </option>
</component>
<!-- Git settings: the most recent Git root path is the project directory itself. -->
<component name="Git.Settings">
  <option name="RECENT_GIT_ROOT_PATH" value="$PROJECT_DIR$" />
</component>
<!-- Markdown settings migration marker; stateVersion is 1. -->
<component name="MarkdownSettingsMigration">
  <option name="stateVersion" value="1" />
</component>
<!-- Opaque identifier assigned to this project. -->
<component name="ProjectId"
           id="24KJYqb7IjKGUSNqPXUOjBSp5gx" />
<!-- Project-level VCS manager; flagged as having manually edited settings. -->
<component name="ProjectLevelVcsManager"
           settingsEditedManually="true" />
<!-- Project view state: both hideEmptyMiddlePackages and showLibraryContents are true. -->
<component name="ProjectViewState">
  <option name="hideEmptyMiddlePackages" value="true" />
  <option name="showLibraryContents" value="true" />
</component>
<!-- Flat key/value properties: run-once activity flags, the last opened file path
     (a sibling directory outside $PROJECT_DIR$), eslint/tslint detection and selection,
     and the last selected settings page. -->
<component name="PropertiesComponent">
  <property name="RunOnceActivity.OpenProjectViewOnStart" value="true" />
  <property name="RunOnceActivity.ShowReadmeOnStart" value="true" />
  <property name="WebServerToolWindowFactoryState" value="false" />
  <property name="last_opened_file_path" value="$PROJECT_DIR$/../wav2vec2-base-turkish-artificial-cv" />
  <property name="node.js.detected.package.eslint" value="true" />
  <property name="node.js.detected.package.tslint" value="true" />
  <property name="node.js.selected.package.eslint" value="(autodetect)" />
  <property name="node.js.selected.package.tslint" value="(autodetect)" />
  <property name="settings.editor.selected.configurable" value="com.jetbrains.python.configuration.PyActiveSdkModuleConfigurable" />
</component>
<!-- Recent entries for the CopyFile key; the only one is $PROJECT_DIR$/language_model. -->
<component name="RecentsManager">
  <key name="CopyFile.RECENT_KEYS">
    <recent name="$PROJECT_DIR$/language_model" />
  </key>
</component>
<!-- Python run configurations for module wav2vec2-base-turkish; "Python.eval" is selected.
     Four configurations are defined: eval, ngram, run_speech_recognition_ctc and test-vocab.
     ngram and test-vocab are marked temporary and are listed again under recent_temporary.
     All four share the same working directory ($PROJECT_DIR$), module SDK and
     PYTHONUNBUFFERED=1 environment; they differ in SCRIPT_NAME and PARAMETERS. -->
<component name="RunManager" selected="Python.eval">
  <!-- eval: runs eval.py; PARAMETERS point data_dir at an absolute path outside the project. -->
  <configuration name="eval"
                 type="PythonConfigurationType"
                 factoryName="Python"
                 nameIsGenerated="true">
    <module name="wav2vec2-base-turkish" />
    <option name="INTERPRETER_OPTIONS" value="" />
    <option name="PARENT_ENVS" value="true" />
    <envs>
      <env name="PYTHONUNBUFFERED" value="1" />
    </envs>
    <option name="SDK_HOME" value="" />
    <option name="WORKING_DIRECTORY" value="$PROJECT_DIR$" />
    <option name="IS_MODULE_SDK" value="true" />
    <option name="ADD_CONTENT_ROOTS" value="true" />
    <option name="ADD_SOURCE_ROOTS" value="true" />
    <EXTENSION ID="PythonCoverageRunConfigurationExtension" runner="coverage.py" />
    <option name="SCRIPT_NAME" value="$PROJECT_DIR$/eval.py" />
    <option name="PARAMETERS" value="--model_id cahya/wav2vec2-base-turkish --dataset ./dataset/common_voice --config tr --data_dir /mnt/mldata/data/ASR/turkish/cv-corpus-6.1-2020-12-11 --split test --log_outputs" />
    <option name="SHOW_COMMAND_LINE" value="false" />
    <option name="EMULATE_TERMINAL" value="false" />
    <option name="MODULE_MODE" value="false" />
    <option name="REDIRECT_INPUT" value="false" />
    <option name="INPUT_FILE" value="" />
    <method v="2" />
  </configuration>
  <!-- ngram: temporary configuration that runs ngram.py with no parameters. -->
  <configuration name="ngram"
                 type="PythonConfigurationType"
                 factoryName="Python"
                 temporary="true"
                 nameIsGenerated="true">
    <module name="wav2vec2-base-turkish" />
    <option name="INTERPRETER_OPTIONS" value="" />
    <option name="PARENT_ENVS" value="true" />
    <envs>
      <env name="PYTHONUNBUFFERED" value="1" />
    </envs>
    <option name="SDK_HOME" value="" />
    <option name="WORKING_DIRECTORY" value="$PROJECT_DIR$" />
    <option name="IS_MODULE_SDK" value="true" />
    <option name="ADD_CONTENT_ROOTS" value="true" />
    <option name="ADD_SOURCE_ROOTS" value="true" />
    <EXTENSION ID="PythonCoverageRunConfigurationExtension" runner="coverage.py" />
    <option name="SCRIPT_NAME" value="$PROJECT_DIR$/ngram.py" />
    <option name="PARAMETERS" value="" />
    <option name="SHOW_COMMAND_LINE" value="false" />
    <option name="EMULATE_TERMINAL" value="false" />
    <option name="MODULE_MODE" value="false" />
    <option name="REDIRECT_INPUT" value="false" />
    <option name="INPUT_FILE" value="" />
    <method v="2" />
  </configuration>
  <!-- run_speech_recognition_ctc: runs the training script. The PARAMETERS value is kept
       on a single line on purpose: line breaks inside an attribute value would be
       normalized to spaces by the parser, and the trailing ignore-character list
       (including the U+FFFD replacement character) must stay byte-for-byte intact. -->
  <configuration name="run_speech_recognition_ctc"
                 type="PythonConfigurationType"
                 factoryName="Python"
                 nameIsGenerated="true">
    <module name="wav2vec2-base-turkish" />
    <option name="INTERPRETER_OPTIONS" value="" />
    <option name="PARENT_ENVS" value="true" />
    <envs>
      <env name="PYTHONUNBUFFERED" value="1" />
    </envs>
    <option name="SDK_HOME" value="" />
    <option name="WORKING_DIRECTORY" value="$PROJECT_DIR$" />
    <option name="IS_MODULE_SDK" value="true" />
    <option name="ADD_CONTENT_ROOTS" value="true" />
    <option name="ADD_SOURCE_ROOTS" value="true" />
    <EXTENSION ID="PythonCoverageRunConfigurationExtension" runner="coverage.py" />
    <option name="SCRIPT_NAME" value="$PROJECT_DIR$/run_speech_recognition_ctc.py" />
    <option name="PARAMETERS" value="--dataset_name=&quot;common_voice&quot; --model_name_or_path=&quot;cahya/wav2vec2-base-turkish-artificial-cv&quot; --dataset_config_name=&quot;tr&quot; --output_dir=&quot;./output&quot; --overwrite_output_dir --num_train_epochs=&quot;1&quot; --per_device_train_batch_size=&quot;2&quot; --per_device_eval_batch_size=&quot;2&quot; --gradient_accumulation_steps=&quot;4&quot; --learning_rate=&quot;7.5e-7&quot; --warmup_steps=&quot;2000&quot; --length_column_name=&quot;input_length&quot; --evaluation_strategy=&quot;steps&quot; --text_column_name=&quot;sentence&quot; --save_steps=&quot;500&quot; --eval_steps=&quot;500&quot; --logging_steps=&quot;100&quot; --layerdrop=&quot;0.0&quot; --activation_dropout=&quot;0.1&quot; --save_total_limit=&quot;3&quot; --freeze_feature_encoder --feat_proj_dropout=&quot;0.0&quot; --mask_time_prob=&quot;0.75&quot; --mask_time_length=&quot;10&quot; --mask_feature_prob=&quot;0.25&quot; --mask_feature_length=&quot;64&quot; --gradient_checkpointing --use_auth_token --fp16=false --group_by_length --do_train=true --do_eval=true --push_to_hub --chars_to_ignore , ? . ! \; \: \&quot;\&quot; \% \' \&quot; \' \' \` … \’ » « \‘ '“' '”' � é û" />
    <option name="SHOW_COMMAND_LINE" value="false" />
    <option name="EMULATE_TERMINAL" value="false" />
    <option name="MODULE_MODE" value="false" />
    <option name="REDIRECT_INPUT" value="false" />
    <option name="INPUT_FILE" value="" />
    <method v="2" />
  </configuration>
  <!-- test-vocab: temporary configuration that runs test-vocab.py with no parameters. -->
  <configuration name="test-vocab"
                 type="PythonConfigurationType"
                 factoryName="Python"
                 temporary="true"
                 nameIsGenerated="true">
    <module name="wav2vec2-base-turkish" />
    <option name="INTERPRETER_OPTIONS" value="" />
    <option name="PARENT_ENVS" value="true" />
    <envs>
      <env name="PYTHONUNBUFFERED" value="1" />
    </envs>
    <option name="SDK_HOME" value="" />
    <option name="WORKING_DIRECTORY" value="$PROJECT_DIR$" />
    <option name="IS_MODULE_SDK" value="true" />
    <option name="ADD_CONTENT_ROOTS" value="true" />
    <option name="ADD_SOURCE_ROOTS" value="true" />
    <EXTENSION ID="PythonCoverageRunConfigurationExtension" runner="coverage.py" />
    <option name="SCRIPT_NAME" value="$PROJECT_DIR$/test-vocab.py" />
    <option name="PARAMETERS" value="" />
    <option name="SHOW_COMMAND_LINE" value="false" />
    <option name="EMULATE_TERMINAL" value="false" />
    <option name="MODULE_MODE" value="false" />
    <option name="REDIRECT_INPUT" value="false" />
    <option name="INPUT_FILE" value="" />
    <method v="2" />
  </configuration>
  <!-- The two temporary configurations, referenced by their "Python." prefixed names. -->
  <recent_temporary>
    <list>
      <item itemvalue="Python.ngram" />
      <item itemvalue="Python.test-vocab" />
    </list>
  </recent_temporary>
</component>
<!-- Spell checker settings: no runtime dictionaries, folders or custom dictionaries;
     a single application-level default dictionary is used. -->
<component name="SpellCheckerSettings"
           RuntimeDictionaries="0"
           Folders="0"
           CustomDictionaries="0"
           DefaultDictionary="application-level"
           UseSingleDictionary="true"
           transferred="true" />
<!-- Task list: the active "Default" task (bound to the "Changes" changelist, with four
     recorded work items) plus two LOCAL tasks whose summaries match the commit messages
     "update unigrams.txt" and "Add check_sound.ipynb". localTasksCounter is 3.
     NOTE(review): created/updated/from values look like epoch-millisecond timestamps
     and duration like milliseconds; confirm before relying on the units. -->
<component name="TaskManager">
  <task active="true" id="Default" summary="Default task">
    <changelist id="c9169370-1a11-41d7-9648-02694630edd2" name="Changes" comment="" />
    <created>1643373395175</created>
    <option name="number" value="Default" />
    <option name="presentableId" value="Default" />
    <updated>1643373395175</updated>
    <workItem from="1643373396354" duration="4135000" />
    <workItem from="1643465640987" duration="10417000" />
    <workItem from="1643646039461" duration="615000" />
    <workItem from="1643706833181" duration="7235000" />
  </task>
  <task id="LOCAL-00001" summary="update unigrams.txt">
    <created>1643492393885</created>
    <option name="number" value="00001" />
    <option name="presentableId" value="LOCAL-00001" />
    <option name="project" value="LOCAL" />
    <updated>1643492393885</updated>
  </task>
  <task id="LOCAL-00002" summary="Add check_sound.ipynb">
    <created>1643710330931</created>
    <option name="number" value="00002" />
    <option name="presentableId" value="LOCAL-00002" />
    <option name="project" value="LOCAL" />
    <updated>1643710330931</updated>
  </task>
  <option name="localTasksCounter" value="3" />
  <servers />
</component>
<!-- TypeScript generated-files manager state; version is 3. -->
<component name="TypeScriptGeneratedFilesManager">
  <option name="version" value="3" />
</component>
<!-- Stored commit messages; LAST_COMMIT_MESSAGE equals the second MESSAGE entry. -->
<component name="VcsManagerConfiguration">
  <MESSAGE value="update unigrams.txt" />
  <MESSAGE value="Add check_sound.ipynb" />
  <option name="LAST_COMMIT_MESSAGE" value="Add check_sound.ipynb" />
</component>
<!-- Debugger state: seven enabled python-line breakpoints, each suspending the thread.
     Five are in project scripts (run_speech_recognition_ctc.py, ngram.py, test-vocab.py
     and two in eval.py); two are in a sibling ../transformers checkout outside the
     project directory. timeStamp values run from 1 to 7 in document order. -->
<component name="XDebuggerManager">
  <breakpoint-manager>
    <breakpoints>
      <line-breakpoint enabled="true" suspend="THREAD" type="python-line">
        <url>file://$PROJECT_DIR$/run_speech_recognition_ctc.py</url>
        <line>747</line>
        <option name="timeStamp" value="1" />
      </line-breakpoint>
      <line-breakpoint enabled="true" suspend="THREAD" type="python-line">
        <url>file://$PROJECT_DIR$/ngram.py</url>
        <line>5</line>
        <option name="timeStamp" value="2" />
      </line-breakpoint>
      <line-breakpoint enabled="true" suspend="THREAD" type="python-line">
        <url>file://$PROJECT_DIR$/test-vocab.py</url>
        <line>5</line>
        <option name="timeStamp" value="3" />
      </line-breakpoint>
      <line-breakpoint enabled="true" suspend="THREAD" type="python-line">
        <url>file://$PROJECT_DIR$/eval.py</url>
        <line>67</line>
        <option name="timeStamp" value="4" />
      </line-breakpoint>
      <line-breakpoint enabled="true" suspend="THREAD" type="python-line">
        <url>file://$PROJECT_DIR$/eval.py</url>
        <line>86</line>
        <option name="timeStamp" value="5" />
      </line-breakpoint>
      <line-breakpoint enabled="true" suspend="THREAD" type="python-line">
        <url>file://$PROJECT_DIR$/../transformers/src/transformers/pipelines/base.py</url>
        <line>1026</line>
        <option name="timeStamp" value="6" />
      </line-breakpoint>
      <line-breakpoint enabled="true" suspend="THREAD" type="python-line">
        <url>file://$PROJECT_DIR$/../transformers/src/transformers/pipelines/automatic_speech_recognition.py</url>
        <line>312</line>
        <option name="timeStamp" value="7" />
      </line-breakpoint>
    </breakpoints>
  </breakpoint-manager>
</component>
<!-- Coverage suites, one per run configuration (test-vocab, eval, ngram,
     run_speech_recognition_ctc). Every suite uses the coverage.py runner, the default
     coverage file provider and $PROJECT_DIR$ as working directory; they differ only in
     FILE_PATH, NAME and MODIFIED. -->
<component name="com.intellij.coverage.CoverageDataManagerImpl">
  <SUITE FILE_PATH="coverage/wav2vec2_base_turkish$test_vocab.coverage"
         NAME="test-vocab Coverage Results"
         MODIFIED="1643475983769"
         SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider"
         RUNNER="coverage.py"
         COVERAGE_BY_TEST_ENABLED="true"
         COVERAGE_TRACING_ENABLED="false"
         WORKING_DIRECTORY="$PROJECT_DIR$" />
  <SUITE FILE_PATH="coverage/wav2vec2_base_turkish$eval.coverage"
         NAME="eval Coverage Results"
         MODIFIED="1643720743098"
         SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider"
         RUNNER="coverage.py"
         COVERAGE_BY_TEST_ENABLED="true"
         COVERAGE_TRACING_ENABLED="false"
         WORKING_DIRECTORY="$PROJECT_DIR$" />
  <SUITE FILE_PATH="coverage/wav2vec2_base_turkish$ngram.coverage"
         NAME="ngram Coverage Results"
         MODIFIED="1643492280791"
         SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider"
         RUNNER="coverage.py"
         COVERAGE_BY_TEST_ENABLED="true"
         COVERAGE_TRACING_ENABLED="false"
         WORKING_DIRECTORY="$PROJECT_DIR$" />
  <SUITE FILE_PATH="coverage/wav2vec2_base_turkish$run_speech_recognition_ctc.coverage"
         NAME="run_speech_recognition_ctc Coverage Results"
         MODIFIED="1643376049209"
         SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider"
         RUNNER="coverage.py"
         COVERAGE_BY_TEST_ENABLED="true"
         COVERAGE_TRACING_ENABLED="false"
         WORKING_DIRECTORY="$PROJECT_DIR$" />
</component>
</project>